{
  "nbformat": 4,
  "nbformat_minor": 0,
  "metadata": {
    "colab": {
      "provenance": [],
      "collapsed_sections": []
    },
    "kernelspec": {
      "name": "python3",
      "display_name": "Python 3"
    },
    "language_info": {
      "name": "python"
    }
  },
  "cells": [
    {
      "cell_type": "markdown",
      "source": [
        "[<img align=\"left\" src=\"https://colab.research.google.com/assets/colab-badge.svg\">](https://colab.research.google.com/github/sail-sg/envpool/blob/main/demo/envpool_demo_breakout.ipynb)"
      ],
      "metadata": {
        "id": "3XJJ0SaDUeoR"
      }
    },
    {
      "cell_type": "code",
      "execution_count": null,
      "metadata": {
        "id": "lIyDa5q_zWih"
      },
      "outputs": [],
      "source": [
        "# OS: Ubuntu 18.04.4 LTS x86_64\n",
        "# Kernel: 4.18.0-15-generic\n",
        "# CPU: Intel(R) Core(TM) i9-10920X CPU (24) @ 3.50GHz\n",
        "# GPU: NVIDIA GeForce RTX 2080 Ti\n",
        "!apt-get install -y \\\n",
        "    libgl1-mesa-dev \\\n",
        "    libgl1-mesa-glx \\\n",
        "    libglew-dev \\\n",
        "    libosmesa6-dev \\\n",
        "    software-properties-common\n",
        "\n",
        "!apt-get install -y patchelf\n",
        "!pip install git+https://github.com/Denys88/rl_games\n",
        "!pip install envpool\n",
        "!pip install gym\n",
        "\n",
        "!pip install free-mujoco-py\n",
        "!apt-get install -y xvfb python-opengl ffmpeg > /dev/null 2>&1\n",
        "!pip install imageio==2.4.1\n",
        "!pip install -U colabgymrender"
      ]
    },
    {
      "cell_type": "code",
      "source": [
        "from rl_games.torch_runner import Runner"
      ],
      "metadata": {
        "id": "LTVQdyGO0TA3"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "## breakout_envpool config:\n",
        "breakout_config = {'params': {'algo': {'name': 'a2c_discrete'}, \n",
        "                              'model': {'name': 'discrete_a2c'}, \n",
        "                              'network': {'name': 'actor_critic', \n",
        "                                          'separate': False, \n",
        "                                          'space': {'discrete': None}, \n",
        "                                          'cnn': {'permute_input': False, \n",
        "                                                  'type': 'conv2d', \n",
        "                                                  'activation': 'relu', \n",
        "                                                  'initializer': {'name': 'orthogonal_initializer', 'gain': 1.41421356237}, \n",
        "                                                  'convs': [{'filters': 32, 'kernel_size': 8, 'strides': 4, 'padding': 0}, \n",
        "                                                            {'filters': 64, 'kernel_size': 4, 'strides': 2, 'padding': 0}, \n",
        "                                                            {'filters': 64, 'kernel_size': 3, 'strides': 1, 'padding': 0}]}, \n",
        "                                          'mlp': {'units': [512], 'activation': 'relu', 'initializer': {'name': 'orthogonal_initializer', 'gain': 1.41421356237}}}, \n",
        "                              'config': {'name': 'Breakout_envpool', \n",
        "                                          'env_name': 'envpool', \n",
        "                                          'score_to_win': 900, \n",
        "                                          'normalize_value': True, \n",
        "                                          'normalize_input': False, \n",
        "                                          'reward_shaper': {'scale_value': 1}, \n",
        "                                          'normalize_advantage': True, \n",
        "                                          'gamma': 0.999, \n",
        "                                          'tau': 0.95, \n",
        "                                          'learning_rate': '8e-4', \n",
        "                                          'lr_schedule': 'None', \n",
        "                                          'kl_threshold': 0.01, \n",
        "                                          'grad_norm': 1.0, \n",
        "                                          'entropy_coef': 0.01, \n",
        "                                          'truncate_grads': True, \n",
        "                                          'e_clip': 0.2, \n",
        "                                          'clip_value': False, \n",
        "                                          'num_actors': 64, \n",
        "                                          'horizon_length': 128, \n",
        "                                          'minibatch_size': 1024, \n",
        "                                          'mini_epochs': 2, \n",
        "                                          'critic_coef': 1, \n",
        "                                          'max_epochs': 1500, \n",
        "                                          'env_config': {'env_name': 'Breakout-v5', 'episodic_life': True, 'has_lives': True}, \n",
        "                                          'player': {'render': False, 'games_num': 200, 'n_game_life': 5, 'determenistic': False}}}}"
      ],
      "metadata": {
        "id": "76pPi11m0Uv1"
      },
      "execution_count": null,
      "outputs": []
    },
    {
      "cell_type": "code",
      "source": [
        "runner = Runner()\n",
        "runner.load(breakout_config)\n",
        "runner.run({\n",
        "    'train': True,\n",
        "})"
      ],
      "metadata": {
        "colab": {
          "base_uri": "https://localhost:8080/"
        },
        "id": "uMH9k4b13h-Y",
        "outputId": "6da13308-00de-46b6-c61f-d64be6a8de9a"
      },
      "execution_count": null,
      "outputs": [
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "self.seed = 1655992919\n",
            "Started to train\n",
            "current training device: cuda:0\n",
            "conv_name: conv2d\n",
            "build mlp: 3136\n",
            "RunningMeanStd:  (1,)\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stderr",
          "text": [
            "/home/liubo/.local/lib/python3.8/site-packages/rl_games/common/experience.py:341: DeprecationWarning: `np.long` is a deprecated alias for `np.compat.long`. To silence this warning, use `np.compat.long` by itself. In the likely event your code does not need to work on Python 2 you can use the builtin `int` for which `np.compat.long` is itself an alias. Doing this will not modify any behaviour and is safe. When replacing `np.long`, you may wish to use e.g. `np.int64` or `np.int32` to specify the precision. If you wish to review your current use, check the release note link for additional information.\n",
            "Deprecated in NumPy 1.20; for more details and guidance: https://numpy.org/devdocs/release/1.20.0-notes.html#deprecations\n",
            "  self.tensor_dict['actions'] = self._create_tensor_from_space(gym.spaces.Box(low=0, high=1,shape=self.actions_shape, dtype=np.long), obs_base_shape)\n"
          ]
        },
        {
          "output_type": "stream",
          "name": "stdout",
          "text": [
            "fps step: 10570 fps step and policy inference: 8468 fps total: 6379 epoch: 1/1500\n",
            "fps step: 6256 fps step and policy inference: 5105 fps total: 4586 epoch: 2/1500\n",
            "fps step: 5151 fps step and policy inference: 4203 fps total: 3778 epoch: 3/1500\n",
            "fps step: 4585 fps step and policy inference: 3745 fps total: 3404 epoch: 4/1500\n",
            "fps step: 4710 fps step and policy inference: 3887 fps total: 3518 epoch: 5/1500\n",
            "fps step: 4352 fps step and policy inference: 3540 fps total: 3244 epoch: 6/1500\n",
            "fps step: 4295 fps step and policy inference: 3417 fps total: 3137 epoch: 7/1500\n",
            "fps step: 4633 fps step and policy inference: 3813 fps total: 3458 epoch: 8/1500\n",
            "fps step: 4562 fps step and policy inference: 3699 fps total: 3374 epoch: 9/1500\n",
            "fps step: 4451 fps step and policy inference: 3580 fps total: 3263 epoch: 10/1500\n",
            "fps step: 4653 fps step and policy inference: 3708 fps total: 3369 epoch: 11/1500\n",
            "fps step: 4603 fps step and policy inference: 3745 fps total: 3402 epoch: 12/1500\n",
            "fps step: 4949 fps step and policy inference: 4032 fps total: 3646 epoch: 13/1500\n",
            "fps step: 4866 fps step and policy inference: 3908 fps total: 3536 epoch: 14/1500\n",
            "fps step: 4718 fps step and policy inference: 3848 fps total: 3508 epoch: 15/1500\n",
            "fps step: 5238 fps step and policy inference: 4213 fps total: 3794 epoch: 16/1500\n",
            "fps step: 5145 fps step and policy inference: 4150 fps total: 3740 epoch: 17/1500\n",
            "fps step: 4542 fps step and policy inference: 3666 fps total: 3352 epoch: 18/1500\n",
            "fps step: 5430 fps step and policy inference: 4382 fps total: 3919 epoch: 19/1500\n",
            "fps step: 5162 fps step and policy inference: 4199 fps total: 3786 epoch: 20/1500\n",
            "fps step: 5189 fps step and policy inference: 4263 fps total: 3835 epoch: 21/1500\n",
            "fps step: 5487 fps step and policy inference: 4460 fps total: 4008 epoch: 22/1500\n",
            "fps step: 5124 fps step and policy inference: 4139 fps total: 3748 epoch: 23/1500\n",
            "fps step: 5140 fps step and policy inference: 4215 fps total: 3788 epoch: 24/1500\n",
            "fps step: 5337 fps step and policy inference: 4364 fps total: 3919 epoch: 25/1500\n",
            "fps step: 5278 fps step and policy inference: 4314 fps total: 3861 epoch: 26/1500\n",
            "fps step: 6026 fps step and policy inference: 4889 fps total: 4404 epoch: 27/1500\n",
            "fps step: 5239 fps step and policy inference: 4216 fps total: 3797 epoch: 28/1500\n",
            "fps step: 5334 fps step and policy inference: 4353 fps total: 3898 epoch: 29/1500\n",
            "fps step: 5727 fps step and policy inference: 4572 fps total: 4112 epoch: 30/1500\n",
            "fps step: 5334 fps step and policy inference: 4269 fps total: 3837 epoch: 31/1500\n",
            "fps step: 5460 fps step and policy inference: 4324 fps total: 3873 epoch: 32/1500\n",
            "fps step: 5663 fps step and policy inference: 4545 fps total: 4053 epoch: 33/1500\n",
            "fps step: 6123 fps step and policy inference: 5012 fps total: 4507 epoch: 34/1500\n",
            "fps step: 5270 fps step and policy inference: 4243 fps total: 3808 epoch: 35/1500\n",
            "fps step: 6078 fps step and policy inference: 5046 fps total: 4534 epoch: 36/1500\n",
            "fps step: 5839 fps step and policy inference: 4791 fps total: 4325 epoch: 37/1500\n",
            "fps step: 5797 fps step and policy inference: 4618 fps total: 4120 epoch: 38/1500\n",
            "fps step: 5706 fps step and policy inference: 4638 fps total: 4125 epoch: 39/1500\n",
            "fps step: 5797 fps step and policy inference: 4683 fps total: 4167 epoch: 40/1500\n",
            "fps step: 6208 fps step and policy inference: 5085 fps total: 4566 epoch: 41/1500\n",
            "fps step: 5657 fps step and policy inference: 4566 fps total: 4074 epoch: 42/1500\n",
            "fps step: 5616 fps step and policy inference: 4534 fps total: 4043 epoch: 43/1500\n",
            "fps step: 6515 fps step and policy inference: 5398 fps total: 4814 epoch: 44/1500\n",
            "fps step: 6311 fps step and policy inference: 5061 fps total: 4545 epoch: 45/1500\n",
            "fps step: 5883 fps step and policy inference: 4792 fps total: 4327 epoch: 46/1500\n",
            "fps step: 5655 fps step and policy inference: 4467 fps total: 4003 epoch: 47/1500\n",
            "fps step: 6238 fps step and policy inference: 5053 fps total: 4540 epoch: 48/1500\n",
            "fps step: 6486 fps step and policy inference: 5281 fps total: 4722 epoch: 49/1500\n",
            "fps step: 6119 fps step and policy inference: 4994 fps total: 4492 epoch: 50/1500\n",
            "fps step: 5720 fps step and policy inference: 4509 fps total: 4028 epoch: 51/1500\n",
            "fps step: 6326 fps step and policy inference: 5135 fps total: 4605 epoch: 52/1500\n",
            "fps step: 6715 fps step and policy inference: 5437 fps total: 4842 epoch: 53/1500\n",
            "fps step: 5694 fps step and policy inference: 4564 fps total: 4137 epoch: 54/1500\n",
            "fps step: 6665 fps step and policy inference: 5458 fps total: 4868 epoch: 55/1500\n",
            "fps step: 6058 fps step and policy inference: 4906 fps total: 4414 epoch: 56/1500\n",
            "fps step: 6244 fps step and policy inference: 5040 fps total: 4533 epoch: 57/1500\n",
            "fps step: 7124 fps step and policy inference: 5816 fps total: 5145 epoch: 58/1500\n",
            "fps step: 6160 fps step and policy inference: 5030 fps total: 4520 epoch: 59/1500\n",
            "fps step: 6995 fps step and policy inference: 5669 fps total: 5032 epoch: 60/1500\n",
            "fps step: 5875 fps step and policy inference: 4721 fps total: 4192 epoch: 61/1500\n",
            "fps step: 6176 fps step and policy inference: 5014 fps total: 4506 epoch: 62/1500\n",
            "fps step: 6189 fps step and policy inference: 4998 fps total: 4493 epoch: 63/1500\n",
            "fps step: 6234 fps step and policy inference: 4946 fps total: 4451 epoch: 64/1500\n",
            "fps step: 6176 fps step and policy inference: 4880 fps total: 4326 epoch: 65/1500\n",
            "fps step: 6160 fps step and policy inference: 4857 fps total: 4379 epoch: 66/1500\n",
            "fps step: 6672 fps step and policy inference: 5447 fps total: 4856 epoch: 67/1500\n",
            "fps step: 6433 fps step and policy inference: 5146 fps total: 4611 epoch: 68/1500\n",
            "fps step: 6169 fps step and policy inference: 5020 fps total: 4511 epoch: 69/1500\n",
            "fps step: 6116 fps step and policy inference: 4815 fps total: 4344 epoch: 70/1500\n",
            "fps step: 6763 fps step and policy inference: 5397 fps total: 4812 epoch: 71/1500\n",
            "fps step: 6104 fps step and policy inference: 4990 fps total: 4487 epoch: 72/1500\n",
            "fps step: 6465 fps step and policy inference: 5282 fps total: 4723 epoch: 73/1500\n",
            "fps step: 6108 fps step and policy inference: 4919 fps total: 4409 epoch: 74/1500\n",
            "fps step: 6285 fps step and policy inference: 5154 fps total: 4616 epoch: 75/1500\n",
            "fps step: 6988 fps step and policy inference: 5584 fps total: 4962 epoch: 76/1500\n",
            "fps step: 6018 fps step and policy inference: 4914 fps total: 4423 epoch: 77/1500\n",
            "fps step: 6916 fps step and policy inference: 5665 fps total: 5026 epoch: 78/1500\n",
            "fps step: 6665 fps step and policy inference: 5375 fps total: 4795 epoch: 79/1500\n",
            "fps step: 5935 fps step and policy inference: 4719 fps total: 4266 epoch: 80/1500\n",
            "fps step: 7243 fps step and policy inference: 5940 fps total: 5242 epoch: 81/1500\n",
            "fps step: 6664 fps step and policy inference: 5535 fps total: 4924 epoch: 82/1500\n",
            "fps step: 6697 fps step and policy inference: 5432 fps total: 4843 epoch: 83/1500\n",
            "fps step: 6666 fps step and policy inference: 5429 fps total: 4841 epoch: 84/1500\n",
            "fps step: 7193 fps step and policy inference: 5761 fps total: 5089 epoch: 85/1500\n",
            "fps step: 7659 fps step and policy inference: 6317 fps total: 5535 epoch: 86/1500\n",
            "fps step: 6390 fps step and policy inference: 5071 fps total: 4544 epoch: 87/1500\n",
            "fps step: 7256 fps step and policy inference: 5936 fps total: 5239 epoch: 88/1500\n",
            "fps step: 6280 fps step and policy inference: 5066 fps total: 4546 epoch: 89/1500\n",
            "fps step: 7629 fps step and policy inference: 6175 fps total: 5423 epoch: 90/1500\n",
            "fps step: 6391 fps step and policy inference: 5353 fps total: 4779 epoch: 91/1500\n",
            "fps step: 7609 fps step and policy inference: 6225 fps total: 5460 epoch: 92/1500\n",
            "fps step: 6983 fps step and policy inference: 5719 fps total: 5068 epoch: 93/1500\n",
            "fps step: 5632 fps step and policy inference: 4472 fps total: 4012 epoch: 94/1500\n",
            "fps step: 6746 fps step and policy inference: 5295 fps total: 4733 epoch: 95/1500\n",
            "fps step: 6589 fps step and policy inference: 5298 fps total: 4722 epoch: 96/1500\n",
            "fps step: 6488 fps step and policy inference: 5231 fps total: 4677 epoch: 97/1500\n",
            "fps step: 7027 fps step and policy inference: 5642 fps total: 5005 epoch: 98/1500\n",
            "fps step: 6535 fps step and policy inference: 5319 fps total: 4751 epoch: 99/1500\n",
            "fps step: 7081 fps step and policy inference: 5729 fps total: 5075 epoch: 100/1500\n",
            "saving next best rewards:  [3.3788164]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6777 fps step and policy inference: 5454 fps total: 4845 epoch: 101/1500\n",
            "fps step: 6139 fps step and policy inference: 4923 fps total: 4436 epoch: 102/1500\n",
            "fps step: 5874 fps step and policy inference: 4709 fps total: 4194 epoch: 103/1500\n",
            "saving next best rewards:  [3.4591439]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7791 fps step and policy inference: 6343 fps total: 5550 epoch: 104/1500\n",
            "fps step: 7182 fps step and policy inference: 5891 fps total: 5201 epoch: 105/1500\n",
            "saving next best rewards:  [3.484466]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6962 fps step and policy inference: 5708 fps total: 5058 epoch: 106/1500\n",
            "saving next best rewards:  [3.514262]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7590 fps step and policy inference: 6162 fps total: 5412 epoch: 107/1500\n",
            "saving next best rewards:  [3.7745383]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6263 fps step and policy inference: 4969 fps total: 4388 epoch: 108/1500\n",
            "saving next best rewards:  [3.9690695]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6568 fps step and policy inference: 5290 fps total: 4727 epoch: 109/1500\n",
            "saving next best rewards:  [3.978831]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7009 fps step and policy inference: 5568 fps total: 4948 epoch: 110/1500\n",
            "fps step: 6523 fps step and policy inference: 5146 fps total: 4609 epoch: 111/1500\n",
            "fps step: 6414 fps step and policy inference: 5132 fps total: 4593 epoch: 112/1500\n",
            "fps step: 6837 fps step and policy inference: 5522 fps total: 4900 epoch: 113/1500\n",
            "fps step: 5842 fps step and policy inference: 4659 fps total: 4159 epoch: 114/1500\n",
            "fps step: 7144 fps step and policy inference: 5928 fps total: 5231 epoch: 115/1500\n",
            "fps step: 7541 fps step and policy inference: 6157 fps total: 5407 epoch: 116/1500\n",
            "fps step: 6888 fps step and policy inference: 5552 fps total: 4916 epoch: 117/1500\n",
            "saving next best rewards:  [3.9874258]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7054 fps step and policy inference: 5695 fps total: 5048 epoch: 118/1500\n",
            "saving next best rewards:  [4.0102034]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6718 fps step and policy inference: 5427 fps total: 4830 epoch: 119/1500\n",
            "fps step: 7249 fps step and policy inference: 6028 fps total: 5307 epoch: 120/1500\n",
            "saving next best rewards:  [4.2239246]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 5887 fps step and policy inference: 4715 fps total: 4210 epoch: 121/1500\n",
            "saving next best rewards:  [4.306622]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7111 fps step and policy inference: 5836 fps total: 5158 epoch: 122/1500\n",
            "fps step: 7481 fps step and policy inference: 5999 fps total: 5285 epoch: 123/1500\n",
            "saving next best rewards:  [4.3125052]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7495 fps step and policy inference: 6056 fps total: 5317 epoch: 124/1500\n",
            "fps step: 6234 fps step and policy inference: 5106 fps total: 4574 epoch: 125/1500\n",
            "fps step: 7887 fps step and policy inference: 6478 fps total: 5653 epoch: 126/1500\n",
            "saving next best rewards:  [4.346729]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6480 fps step and policy inference: 5158 fps total: 4615 epoch: 127/1500\n",
            "saving next best rewards:  [4.4043536]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6830 fps step and policy inference: 5482 fps total: 4878 epoch: 128/1500\n",
            "saving next best rewards:  [4.5567203]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8386 fps step and policy inference: 6823 fps total: 5914 epoch: 129/1500\n",
            "fps step: 7556 fps step and policy inference: 6186 fps total: 5429 epoch: 130/1500\n",
            "saving next best rewards:  [4.637531]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6324 fps step and policy inference: 5132 fps total: 4601 epoch: 131/1500\n",
            "saving next best rewards:  [4.8382044]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7331 fps step and policy inference: 5911 fps total: 5204 epoch: 132/1500\n",
            "fps step: 7365 fps step and policy inference: 5896 fps total: 5206 epoch: 133/1500\n",
            "fps step: 6208 fps step and policy inference: 4933 fps total: 4438 epoch: 134/1500\n",
            "fps step: 6429 fps step and policy inference: 5151 fps total: 4604 epoch: 135/1500\n",
            "fps step: 6228 fps step and policy inference: 5016 fps total: 4502 epoch: 136/1500\n",
            "fps step: 8148 fps step and policy inference: 6685 fps total: 5812 epoch: 137/1500\n",
            "fps step: 7001 fps step and policy inference: 5710 fps total: 5059 epoch: 138/1500\n",
            "fps step: 7071 fps step and policy inference: 5689 fps total: 5032 epoch: 139/1500\n",
            "saving next best rewards:  [4.911133]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8616 fps step and policy inference: 6935 fps total: 6002 epoch: 140/1500\n",
            "fps step: 6542 fps step and policy inference: 5218 fps total: 4660 epoch: 141/1500\n",
            "saving next best rewards:  [5.0805364]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7193 fps step and policy inference: 5894 fps total: 5188 epoch: 142/1500\n",
            "saving next best rewards:  [5.205803]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6548 fps step and policy inference: 5189 fps total: 4645 epoch: 143/1500\n",
            "saving next best rewards:  [5.2218266]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7158 fps step and policy inference: 5663 fps total: 5024 epoch: 144/1500\n",
            "fps step: 7488 fps step and policy inference: 6066 fps total: 5322 epoch: 145/1500\n",
            "saving next best rewards:  [5.2892976]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7615 fps step and policy inference: 6204 fps total: 5442 epoch: 146/1500\n",
            "fps step: 7464 fps step and policy inference: 5907 fps total: 5210 epoch: 147/1500\n",
            "fps step: 7646 fps step and policy inference: 6237 fps total: 5467 epoch: 148/1500\n",
            "fps step: 6977 fps step and policy inference: 5515 fps total: 4905 epoch: 149/1500\n",
            "fps step: 6835 fps step and policy inference: 5517 fps total: 4907 epoch: 150/1500\n",
            "fps step: 7534 fps step and policy inference: 6040 fps total: 5314 epoch: 151/1500\n",
            "fps step: 7100 fps step and policy inference: 5825 fps total: 5151 epoch: 152/1500\n",
            "saving next best rewards:  [5.393074]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7563 fps step and policy inference: 6209 fps total: 5450 epoch: 153/1500\n",
            "fps step: 8095 fps step and policy inference: 6478 fps total: 5659 epoch: 154/1500\n",
            "fps step: 6844 fps step and policy inference: 5431 fps total: 4839 epoch: 155/1500\n",
            "saving next best rewards:  [5.5859575]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6730 fps step and policy inference: 5282 fps total: 4716 epoch: 156/1500\n",
            "saving next best rewards:  [5.738788]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6590 fps step and policy inference: 5361 fps total: 4788 epoch: 157/1500\n",
            "fps step: 6679 fps step and policy inference: 5323 fps total: 4752 epoch: 158/1500\n",
            "saving next best rewards:  [5.78205]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7290 fps step and policy inference: 5929 fps total: 5229 epoch: 159/1500\n",
            "fps step: 7743 fps step and policy inference: 6143 fps total: 5398 epoch: 160/1500\n",
            "fps step: 7893 fps step and policy inference: 6505 fps total: 5673 epoch: 161/1500\n",
            "fps step: 7202 fps step and policy inference: 5846 fps total: 5166 epoch: 162/1500\n",
            "fps step: 8206 fps step and policy inference: 6546 fps total: 5705 epoch: 163/1500\n",
            "fps step: 7455 fps step and policy inference: 6010 fps total: 5272 epoch: 164/1500\n",
            "fps step: 6836 fps step and policy inference: 5600 fps total: 4973 epoch: 165/1500\n",
            "fps step: 6308 fps step and policy inference: 5040 fps total: 4525 epoch: 166/1500\n",
            "saving next best rewards:  [5.960059]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8042 fps step and policy inference: 6524 fps total: 5685 epoch: 167/1500\n",
            "fps step: 7641 fps step and policy inference: 6206 fps total: 5444 epoch: 168/1500\n",
            "fps step: 7602 fps step and policy inference: 6126 fps total: 5384 epoch: 169/1500\n",
            "fps step: 7092 fps step and policy inference: 5893 fps total: 5201 epoch: 170/1500\n",
            "fps step: 7486 fps step and policy inference: 6088 fps total: 5354 epoch: 171/1500\n",
            "fps step: 7198 fps step and policy inference: 5803 fps total: 5129 epoch: 172/1500\n",
            "fps step: 6950 fps step and policy inference: 5694 fps total: 5045 epoch: 173/1500\n",
            "fps step: 8097 fps step and policy inference: 6673 fps total: 5805 epoch: 174/1500\n",
            "fps step: 6361 fps step and policy inference: 5205 fps total: 4659 epoch: 175/1500\n",
            "saving next best rewards:  [6.125639]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7470 fps step and policy inference: 5999 fps total: 5284 epoch: 176/1500\n",
            "fps step: 8442 fps step and policy inference: 6767 fps total: 5873 epoch: 177/1500\n",
            "fps step: 7086 fps step and policy inference: 5771 fps total: 5107 epoch: 178/1500\n",
            "fps step: 6665 fps step and policy inference: 5295 fps total: 4728 epoch: 179/1500\n",
            "saving next best rewards:  [6.1550446]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7307 fps step and policy inference: 5924 fps total: 5225 epoch: 180/1500\n",
            "saving next best rewards:  [6.248376]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7069 fps step and policy inference: 5673 fps total: 5030 epoch: 181/1500\n",
            "fps step: 7258 fps step and policy inference: 5853 fps total: 5170 epoch: 182/1500\n",
            "fps step: 8899 fps step and policy inference: 7356 fps total: 6314 epoch: 183/1500\n",
            "fps step: 7724 fps step and policy inference: 6271 fps total: 5480 epoch: 184/1500\n",
            "fps step: 7472 fps step and policy inference: 5825 fps total: 5139 epoch: 185/1500\n",
            "saving next best rewards:  [6.646997]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6860 fps step and policy inference: 5487 fps total: 4866 epoch: 186/1500\n",
            "saving next best rewards:  [6.6519623]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8128 fps step and policy inference: 6634 fps total: 5769 epoch: 187/1500\n",
            "saving next best rewards:  [6.6604214]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7081 fps step and policy inference: 5641 fps total: 4992 epoch: 188/1500\n",
            "fps step: 7817 fps step and policy inference: 6290 fps total: 5504 epoch: 189/1500\n",
            "saving next best rewards:  [6.841798]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7261 fps step and policy inference: 5906 fps total: 5211 epoch: 190/1500\n",
            "fps step: 7617 fps step and policy inference: 6080 fps total: 5348 epoch: 191/1500\n",
            "fps step: 6909 fps step and policy inference: 5510 fps total: 4894 epoch: 192/1500\n",
            "fps step: 6469 fps step and policy inference: 5124 fps total: 4590 epoch: 193/1500\n",
            "fps step: 6499 fps step and policy inference: 5206 fps total: 4649 epoch: 194/1500\n",
            "fps step: 7885 fps step and policy inference: 6387 fps total: 5568 epoch: 195/1500\n",
            "fps step: 7252 fps step and policy inference: 5861 fps total: 5176 epoch: 196/1500\n",
            "fps step: 7768 fps step and policy inference: 6307 fps total: 5522 epoch: 197/1500\n",
            "fps step: 7746 fps step and policy inference: 6373 fps total: 5573 epoch: 198/1500\n",
            "fps step: 7961 fps step and policy inference: 6492 fps total: 5663 epoch: 199/1500\n",
            "saving next best rewards:  [6.9124894]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7044 fps step and policy inference: 5676 fps total: 5031 epoch: 200/1500\n",
            "saving next best rewards:  [7.3546133]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8854 fps step and policy inference: 7245 fps total: 6231 epoch: 201/1500\n",
            "fps step: 7656 fps step and policy inference: 6385 fps total: 5581 epoch: 202/1500\n",
            "fps step: 8300 fps step and policy inference: 6746 fps total: 5858 epoch: 203/1500\n",
            "fps step: 8169 fps step and policy inference: 6718 fps total: 5838 epoch: 204/1500\n",
            "fps step: 7656 fps step and policy inference: 6170 fps total: 5413 epoch: 205/1500\n",
            "fps step: 7198 fps step and policy inference: 5889 fps total: 5186 epoch: 206/1500\n",
            "saving next best rewards:  [7.4263897]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7604 fps step and policy inference: 6035 fps total: 5295 epoch: 207/1500\n",
            "fps step: 8665 fps step and policy inference: 6979 fps total: 6031 epoch: 208/1500\n",
            "saving next best rewards:  [7.488877]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8519 fps step and policy inference: 6848 fps total: 5932 epoch: 209/1500\n",
            "fps step: 6974 fps step and policy inference: 5602 fps total: 4967 epoch: 210/1500\n",
            "saving next best rewards:  [7.9715753]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7190 fps step and policy inference: 5691 fps total: 5039 epoch: 211/1500\n",
            "saving next best rewards:  [8.114768]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6804 fps step and policy inference: 5539 fps total: 4926 epoch: 212/1500\n",
            "fps step: 7254 fps step and policy inference: 5865 fps total: 5181 epoch: 213/1500\n",
            "fps step: 7317 fps step and policy inference: 5904 fps total: 5200 epoch: 214/1500\n",
            "fps step: 6749 fps step and policy inference: 5343 fps total: 4765 epoch: 215/1500\n",
            "fps step: 8876 fps step and policy inference: 7127 fps total: 6141 epoch: 216/1500\n",
            "fps step: 9484 fps step and policy inference: 7634 fps total: 6517 epoch: 217/1500\n",
            "fps step: 8081 fps step and policy inference: 6512 fps total: 5682 epoch: 218/1500\n",
            "fps step: 6462 fps step and policy inference: 5205 fps total: 4655 epoch: 219/1500\n",
            "fps step: 8100 fps step and policy inference: 6535 fps total: 5697 epoch: 220/1500\n",
            "fps step: 8335 fps step and policy inference: 6754 fps total: 5851 epoch: 221/1500\n",
            "saving next best rewards:  [8.237596]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7231 fps step and policy inference: 5729 fps total: 5078 epoch: 222/1500\n",
            "saving next best rewards:  [8.379279]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6931 fps step and policy inference: 5543 fps total: 4931 epoch: 223/1500\n",
            "fps step: 8209 fps step and policy inference: 6645 fps total: 5781 epoch: 224/1500\n",
            "fps step: 7844 fps step and policy inference: 6197 fps total: 5428 epoch: 225/1500\n",
            "fps step: 8087 fps step and policy inference: 6502 fps total: 5642 epoch: 226/1500\n",
            "saving next best rewards:  [8.456155]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9046 fps step and policy inference: 7322 fps total: 6292 epoch: 227/1500\n",
            "saving next best rewards:  [8.653183]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7418 fps step and policy inference: 5894 fps total: 5203 epoch: 228/1500\n",
            "saving next best rewards:  [8.85155]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7018 fps step and policy inference: 5663 fps total: 5026 epoch: 229/1500\n",
            "saving next best rewards:  [9.224875]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8143 fps step and policy inference: 6501 fps total: 5671 epoch: 230/1500\n",
            "saving next best rewards:  [9.334941]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7727 fps step and policy inference: 6104 fps total: 5374 epoch: 231/1500\n",
            "saving next best rewards:  [9.358768]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8034 fps step and policy inference: 6487 fps total: 5659 epoch: 232/1500\n",
            "fps step: 7653 fps step and policy inference: 6277 fps total: 5504 epoch: 233/1500\n",
            "fps step: 7362 fps step and policy inference: 5972 fps total: 5269 epoch: 234/1500\n",
            "fps step: 7119 fps step and policy inference: 5686 fps total: 5042 epoch: 235/1500\n",
            "fps step: 8333 fps step and policy inference: 6822 fps total: 5919 epoch: 236/1500\n",
            "fps step: 7071 fps step and policy inference: 5598 fps total: 4959 epoch: 237/1500\n",
            "fps step: 8191 fps step and policy inference: 6680 fps total: 5807 epoch: 238/1500\n",
            "fps step: 7491 fps step and policy inference: 6025 fps total: 5299 epoch: 239/1500\n",
            "fps step: 7400 fps step and policy inference: 5929 fps total: 5227 epoch: 240/1500\n",
            "fps step: 7577 fps step and policy inference: 6224 fps total: 5458 epoch: 241/1500\n",
            "fps step: 7248 fps step and policy inference: 5869 fps total: 5187 epoch: 242/1500\n",
            "fps step: 7636 fps step and policy inference: 6156 fps total: 5402 epoch: 243/1500\n",
            "fps step: 7345 fps step and policy inference: 5973 fps total: 5259 epoch: 244/1500\n",
            "fps step: 7539 fps step and policy inference: 6052 fps total: 5325 epoch: 245/1500\n",
            "fps step: 7911 fps step and policy inference: 6469 fps total: 5645 epoch: 246/1500\n",
            "fps step: 8394 fps step and policy inference: 6773 fps total: 5875 epoch: 247/1500\n",
            "fps step: 8220 fps step and policy inference: 6710 fps total: 5830 epoch: 248/1500\n",
            "fps step: 8519 fps step and policy inference: 6889 fps total: 5945 epoch: 249/1500\n",
            "fps step: 6638 fps step and policy inference: 5375 fps total: 4797 epoch: 250/1500\n",
            "fps step: 9000 fps step and policy inference: 7377 fps total: 6326 epoch: 251/1500\n",
            "fps step: 7815 fps step and policy inference: 6339 fps total: 5546 epoch: 252/1500\n",
            "fps step: 7825 fps step and policy inference: 6267 fps total: 5494 epoch: 253/1500\n",
            "fps step: 7556 fps step and policy inference: 6053 fps total: 5322 epoch: 254/1500\n",
            "fps step: 7388 fps step and policy inference: 5932 fps total: 5230 epoch: 255/1500\n",
            "fps step: 8351 fps step and policy inference: 6752 fps total: 5863 epoch: 256/1500\n",
            "fps step: 9525 fps step and policy inference: 7701 fps total: 6563 epoch: 257/1500\n",
            "fps step: 8508 fps step and policy inference: 6904 fps total: 5974 epoch: 258/1500\n",
            "saving next best rewards:  [9.792122]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7830 fps step and policy inference: 6215 fps total: 5444 epoch: 259/1500\n",
            "saving next best rewards:  [9.908857]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8811 fps step and policy inference: 7066 fps total: 6080 epoch: 260/1500\n",
            "saving next best rewards:  [10.201598]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6793 fps step and policy inference: 5422 fps total: 4832 epoch: 261/1500\n",
            "saving next best rewards:  [10.590834]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7339 fps step and policy inference: 5930 fps total: 5214 epoch: 262/1500\n",
            "fps step: 7875 fps step and policy inference: 6355 fps total: 5559 epoch: 263/1500\n",
            "fps step: 6757 fps step and policy inference: 5437 fps total: 4839 epoch: 264/1500\n",
            "fps step: 7875 fps step and policy inference: 6296 fps total: 5513 epoch: 265/1500\n",
            "fps step: 8787 fps step and policy inference: 6923 fps total: 5982 epoch: 266/1500\n",
            "fps step: 8161 fps step and policy inference: 6516 fps total: 5683 epoch: 267/1500\n",
            "fps step: 7039 fps step and policy inference: 5492 fps total: 4883 epoch: 268/1500\n",
            "fps step: 8355 fps step and policy inference: 6725 fps total: 5839 epoch: 269/1500\n",
            "fps step: 8209 fps step and policy inference: 6702 fps total: 5823 epoch: 270/1500\n",
            "fps step: 8270 fps step and policy inference: 6723 fps total: 5840 epoch: 271/1500\n",
            "saving next best rewards:  [11.15418]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7482 fps step and policy inference: 5925 fps total: 5227 epoch: 272/1500\n",
            "fps step: 7455 fps step and policy inference: 5946 fps total: 5243 epoch: 273/1500\n",
            "fps step: 7827 fps step and policy inference: 6275 fps total: 5483 epoch: 274/1500\n",
            "fps step: 7325 fps step and policy inference: 5811 fps total: 5133 epoch: 275/1500\n",
            "fps step: 9285 fps step and policy inference: 7497 fps total: 6413 epoch: 276/1500\n",
            "fps step: 9308 fps step and policy inference: 7608 fps total: 6497 epoch: 277/1500\n",
            "fps step: 8415 fps step and policy inference: 6751 fps total: 5857 epoch: 278/1500\n",
            "fps step: 7088 fps step and policy inference: 5634 fps total: 4998 epoch: 279/1500\n",
            "fps step: 8482 fps step and policy inference: 6936 fps total: 5997 epoch: 280/1500\n",
            "fps step: 7273 fps step and policy inference: 5989 fps total: 5277 epoch: 281/1500\n",
            "fps step: 6572 fps step and policy inference: 5206 fps total: 4658 epoch: 282/1500\n",
            "fps step: 6833 fps step and policy inference: 5501 fps total: 4892 epoch: 283/1500\n",
            "fps step: 7779 fps step and policy inference: 6225 fps total: 5459 epoch: 284/1500\n",
            "fps step: 7285 fps step and policy inference: 5715 fps total: 5054 epoch: 285/1500\n",
            "fps step: 7847 fps step and policy inference: 6252 fps total: 5483 epoch: 286/1500\n",
            "fps step: 7644 fps step and policy inference: 5999 fps total: 5282 epoch: 287/1500\n",
            "fps step: 9173 fps step and policy inference: 7294 fps total: 6265 epoch: 288/1500\n",
            "fps step: 6999 fps step and policy inference: 5655 fps total: 5004 epoch: 289/1500\n",
            "fps step: 8092 fps step and policy inference: 6575 fps total: 5712 epoch: 290/1500\n",
            "fps step: 8869 fps step and policy inference: 7180 fps total: 6178 epoch: 291/1500\n",
            "fps step: 8268 fps step and policy inference: 6842 fps total: 5929 epoch: 292/1500\n",
            "saving next best rewards:  [11.2650385]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7672 fps step and policy inference: 6213 fps total: 5449 epoch: 293/1500\n",
            "fps step: 8263 fps step and policy inference: 6791 fps total: 5892 epoch: 294/1500\n",
            "fps step: 7221 fps step and policy inference: 5842 fps total: 5163 epoch: 295/1500\n",
            "fps step: 7411 fps step and policy inference: 5920 fps total: 5209 epoch: 296/1500\n",
            "fps step: 8399 fps step and policy inference: 6798 fps total: 5887 epoch: 297/1500\n",
            "fps step: 7841 fps step and policy inference: 6262 fps total: 5488 epoch: 298/1500\n",
            "fps step: 7462 fps step and policy inference: 5976 fps total: 5265 epoch: 299/1500\n",
            "fps step: 7543 fps step and policy inference: 5905 fps total: 5207 epoch: 300/1500\n",
            "fps step: 8169 fps step and policy inference: 6682 fps total: 5803 epoch: 301/1500\n",
            "fps step: 8770 fps step and policy inference: 7131 fps total: 6145 epoch: 302/1500\n",
            "fps step: 7339 fps step and policy inference: 5876 fps total: 5189 epoch: 303/1500\n",
            "fps step: 7668 fps step and policy inference: 6147 fps total: 5399 epoch: 304/1500\n",
            "fps step: 8366 fps step and policy inference: 6800 fps total: 5898 epoch: 305/1500\n",
            "saving next best rewards:  [11.321135]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6798 fps step and policy inference: 5429 fps total: 4834 epoch: 306/1500\n",
            "saving next best rewards:  [11.347021]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8069 fps step and policy inference: 6491 fps total: 5663 epoch: 307/1500\n",
            "fps step: 7530 fps step and policy inference: 6112 fps total: 5374 epoch: 308/1500\n",
            "fps step: 8680 fps step and policy inference: 7036 fps total: 6084 epoch: 309/1500\n",
            "fps step: 8323 fps step and policy inference: 6670 fps total: 5799 epoch: 310/1500\n",
            "fps step: 7143 fps step and policy inference: 5714 fps total: 5060 epoch: 311/1500\n",
            "fps step: 6311 fps step and policy inference: 5076 fps total: 4552 epoch: 312/1500\n",
            "fps step: 7310 fps step and policy inference: 5807 fps total: 5135 epoch: 313/1500\n",
            "fps step: 8471 fps step and policy inference: 6841 fps total: 5932 epoch: 314/1500\n",
            "fps step: 8673 fps step and policy inference: 7098 fps total: 6119 epoch: 315/1500\n",
            "fps step: 7901 fps step and policy inference: 6411 fps total: 5604 epoch: 316/1500\n",
            "fps step: 7909 fps step and policy inference: 6422 fps total: 5599 epoch: 317/1500\n",
            "saving next best rewards:  [11.678578]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8263 fps step and policy inference: 6776 fps total: 5881 epoch: 318/1500\n",
            "saving next best rewards:  [11.837453]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9121 fps step and policy inference: 7325 fps total: 6278 epoch: 319/1500\n",
            "fps step: 8322 fps step and policy inference: 6739 fps total: 5851 epoch: 320/1500\n",
            "fps step: 7299 fps step and policy inference: 5866 fps total: 5169 epoch: 321/1500\n",
            "fps step: 7832 fps step and policy inference: 6176 fps total: 5421 epoch: 322/1500\n",
            "fps step: 7440 fps step and policy inference: 5792 fps total: 5120 epoch: 323/1500\n",
            "fps step: 7552 fps step and policy inference: 6042 fps total: 5317 epoch: 324/1500\n",
            "fps step: 8762 fps step and policy inference: 7087 fps total: 6111 epoch: 325/1500\n",
            "saving next best rewards:  [11.961185]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6990 fps step and policy inference: 5702 fps total: 5051 epoch: 326/1500\n",
            "saving next best rewards:  [12.419674]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8376 fps step and policy inference: 6654 fps total: 5786 epoch: 327/1500\n",
            "fps step: 7928 fps step and policy inference: 6353 fps total: 5560 epoch: 328/1500\n",
            "fps step: 7714 fps step and policy inference: 6158 fps total: 5416 epoch: 329/1500\n",
            "fps step: 9261 fps step and policy inference: 7599 fps total: 6487 epoch: 330/1500\n",
            "fps step: 8176 fps step and policy inference: 6574 fps total: 5721 epoch: 331/1500\n",
            "fps step: 8228 fps step and policy inference: 6533 fps total: 5692 epoch: 332/1500\n",
            "saving next best rewards:  [12.646646]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8513 fps step and policy inference: 6899 fps total: 5968 epoch: 333/1500\n",
            "fps step: 8416 fps step and policy inference: 6753 fps total: 5860 epoch: 334/1500\n",
            "fps step: 6616 fps step and policy inference: 5082 fps total: 4559 epoch: 335/1500\n",
            "saving next best rewards:  [12.842021]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 6852 fps step and policy inference: 5546 fps total: 4929 epoch: 336/1500\n",
            "saving next best rewards:  [13.191847]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7808 fps step and policy inference: 6205 fps total: 5443 epoch: 337/1500\n",
            "fps step: 8848 fps step and policy inference: 7121 fps total: 6136 epoch: 338/1500\n",
            "saving next best rewards:  [13.808141]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8275 fps step and policy inference: 6519 fps total: 5685 epoch: 339/1500\n",
            "fps step: 7351 fps step and policy inference: 5890 fps total: 5198 epoch: 340/1500\n",
            "fps step: 7772 fps step and policy inference: 6229 fps total: 5464 epoch: 341/1500\n",
            "fps step: 9105 fps step and policy inference: 7409 fps total: 6355 epoch: 342/1500\n",
            "fps step: 8723 fps step and policy inference: 7022 fps total: 6065 epoch: 343/1500\n",
            "fps step: 7649 fps step and policy inference: 6184 fps total: 5428 epoch: 344/1500\n",
            "fps step: 7123 fps step and policy inference: 5663 fps total: 5022 epoch: 345/1500\n",
            "fps step: 7590 fps step and policy inference: 6192 fps total: 5440 epoch: 346/1500\n",
            "saving next best rewards:  [14.107501]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7662 fps step and policy inference: 6157 fps total: 5411 epoch: 347/1500\n",
            "saving next best rewards:  [15.062423]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8137 fps step and policy inference: 6588 fps total: 5740 epoch: 348/1500\n",
            "saving next best rewards:  [15.098409]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7555 fps step and policy inference: 6108 fps total: 5374 epoch: 349/1500\n",
            "fps step: 7776 fps step and policy inference: 6347 fps total: 5547 epoch: 350/1500\n",
            "fps step: 9113 fps step and policy inference: 7370 fps total: 6324 epoch: 351/1500\n",
            "fps step: 8326 fps step and policy inference: 6639 fps total: 5775 epoch: 352/1500\n",
            "fps step: 7383 fps step and policy inference: 5947 fps total: 5232 epoch: 353/1500\n",
            "fps step: 8558 fps step and policy inference: 6971 fps total: 6025 epoch: 354/1500\n",
            "saving next best rewards:  [15.110613]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8649 fps step and policy inference: 6794 fps total: 5890 epoch: 355/1500\n",
            "saving next best rewards:  [15.657738]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7661 fps step and policy inference: 6104 fps total: 5366 epoch: 356/1500\n",
            "saving next best rewards:  [16.597609]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7550 fps step and policy inference: 5996 fps total: 5281 epoch: 357/1500\n",
            "fps step: 7828 fps step and policy inference: 6321 fps total: 5531 epoch: 358/1500\n",
            "fps step: 8230 fps step and policy inference: 6722 fps total: 5838 epoch: 359/1500\n",
            "fps step: 7240 fps step and policy inference: 5791 fps total: 5122 epoch: 360/1500\n",
            "fps step: 8619 fps step and policy inference: 6934 fps total: 5997 epoch: 361/1500\n",
            "fps step: 7996 fps step and policy inference: 6479 fps total: 5638 epoch: 362/1500\n",
            "fps step: 7761 fps step and policy inference: 6127 fps total: 5384 epoch: 363/1500\n",
            "fps step: 7161 fps step and policy inference: 5733 fps total: 5078 epoch: 364/1500\n",
            "fps step: 8731 fps step and policy inference: 7068 fps total: 6097 epoch: 365/1500\n",
            "fps step: 8752 fps step and policy inference: 6958 fps total: 6025 epoch: 366/1500\n",
            "fps step: 7985 fps step and policy inference: 6606 fps total: 5752 epoch: 367/1500\n",
            "fps step: 8491 fps step and policy inference: 6890 fps total: 5965 epoch: 368/1500\n",
            "fps step: 9420 fps step and policy inference: 7542 fps total: 6444 epoch: 369/1500\n",
            "fps step: 7486 fps step and policy inference: 6122 fps total: 5380 epoch: 370/1500\n",
            "fps step: 7589 fps step and policy inference: 6134 fps total: 5390 epoch: 371/1500\n",
            "fps step: 7899 fps step and policy inference: 6386 fps total: 5581 epoch: 372/1500\n",
            "fps step: 8446 fps step and policy inference: 6725 fps total: 5841 epoch: 373/1500\n",
            "fps step: 7730 fps step and policy inference: 6064 fps total: 5336 epoch: 374/1500\n",
            "fps step: 7816 fps step and policy inference: 6218 fps total: 5455 epoch: 375/1500\n",
            "fps step: 8185 fps step and policy inference: 6524 fps total: 5687 epoch: 376/1500\n",
            "fps step: 8234 fps step and policy inference: 6675 fps total: 5804 epoch: 377/1500\n",
            "fps step: 7397 fps step and policy inference: 5962 fps total: 5260 epoch: 378/1500\n",
            "fps step: 8358 fps step and policy inference: 6717 fps total: 5834 epoch: 379/1500\n",
            "fps step: 8349 fps step and policy inference: 6705 fps total: 5826 epoch: 380/1500\n",
            "saving next best rewards:  [16.893972]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7034 fps step and policy inference: 5535 fps total: 4926 epoch: 381/1500\n",
            "saving next best rewards:  [16.930658]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7697 fps step and policy inference: 6092 fps total: 5357 epoch: 382/1500\n",
            "fps step: 7449 fps step and policy inference: 6014 fps total: 5295 epoch: 383/1500\n",
            "fps step: 6691 fps step and policy inference: 5210 fps total: 4658 epoch: 384/1500\n",
            "saving next best rewards:  [17.175018]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7481 fps step and policy inference: 5916 fps total: 5220 epoch: 385/1500\n",
            "fps step: 9373 fps step and policy inference: 7530 fps total: 6419 epoch: 386/1500\n",
            "saving next best rewards:  [17.544489]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7549 fps step and policy inference: 5928 fps total: 5217 epoch: 387/1500\n",
            "saving next best rewards:  [19.912893]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8511 fps step and policy inference: 6857 fps total: 5938 epoch: 388/1500\n",
            "fps step: 8583 fps step and policy inference: 6965 fps total: 6021 epoch: 389/1500\n",
            "fps step: 8667 fps step and policy inference: 6975 fps total: 6027 epoch: 390/1500\n",
            "fps step: 8592 fps step and policy inference: 7079 fps total: 6106 epoch: 391/1500\n",
            "fps step: 8741 fps step and policy inference: 6966 fps total: 6024 epoch: 392/1500\n",
            "fps step: 8542 fps step and policy inference: 6929 fps total: 5994 epoch: 393/1500\n",
            "fps step: 8855 fps step and policy inference: 7258 fps total: 6232 epoch: 394/1500\n",
            "fps step: 7493 fps step and policy inference: 5979 fps total: 5273 epoch: 395/1500\n",
            "saving next best rewards:  [20.93684]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9057 fps step and policy inference: 7295 fps total: 6265 epoch: 396/1500\n",
            "fps step: 8998 fps step and policy inference: 7218 fps total: 6207 epoch: 397/1500\n",
            "fps step: 8320 fps step and policy inference: 6620 fps total: 5766 epoch: 398/1500\n",
            "saving next best rewards:  [21.675663]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9818 fps step and policy inference: 7927 fps total: 6706 epoch: 399/1500\n",
            "saving next best rewards:  [22.008396]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8851 fps step and policy inference: 7094 fps total: 6114 epoch: 400/1500\n",
            "saving next best rewards:  [22.433498]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7461 fps step and policy inference: 5927 fps total: 5228 epoch: 401/1500\n",
            "fps step: 7897 fps step and policy inference: 6396 fps total: 5593 epoch: 402/1500\n",
            "saving next best rewards:  [22.817749]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8477 fps step and policy inference: 6871 fps total: 5951 epoch: 403/1500\n",
            "fps step: 8586 fps step and policy inference: 7028 fps total: 6074 epoch: 404/1500\n",
            "fps step: 7409 fps step and policy inference: 5832 fps total: 5154 epoch: 405/1500\n",
            "fps step: 8404 fps step and policy inference: 6693 fps total: 5813 epoch: 406/1500\n",
            "saving next best rewards:  [24.379225]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8275 fps step and policy inference: 6577 fps total: 5728 epoch: 407/1500\n",
            "fps step: 7815 fps step and policy inference: 6262 fps total: 5491 epoch: 408/1500\n",
            "fps step: 10027 fps step and policy inference: 8008 fps total: 6784 epoch: 409/1500\n",
            "fps step: 8058 fps step and policy inference: 6548 fps total: 5709 epoch: 410/1500\n",
            "fps step: 7838 fps step and policy inference: 6241 fps total: 5469 epoch: 411/1500\n",
            "fps step: 8389 fps step and policy inference: 6918 fps total: 5988 epoch: 412/1500\n",
            "fps step: 9135 fps step and policy inference: 7320 fps total: 6285 epoch: 413/1500\n",
            "fps step: 10168 fps step and policy inference: 8221 fps total: 6928 epoch: 414/1500\n",
            "fps step: 7972 fps step and policy inference: 6421 fps total: 5609 epoch: 415/1500\n",
            "fps step: 8491 fps step and policy inference: 6744 fps total: 5863 epoch: 416/1500\n",
            "fps step: 9131 fps step and policy inference: 7321 fps total: 6278 epoch: 417/1500\n",
            "fps step: 8436 fps step and policy inference: 6950 fps total: 6011 epoch: 418/1500\n",
            "saving next best rewards:  [26.52502]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8281 fps step and policy inference: 6645 fps total: 5775 epoch: 419/1500\n",
            "saving next best rewards:  [27.020956]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7950 fps step and policy inference: 6278 fps total: 5482 epoch: 420/1500\n",
            "fps step: 9388 fps step and policy inference: 7560 fps total: 6459 epoch: 421/1500\n",
            "fps step: 9767 fps step and policy inference: 7781 fps total: 6615 epoch: 422/1500\n",
            "fps step: 8975 fps step and policy inference: 7129 fps total: 6142 epoch: 423/1500\n",
            "fps step: 8700 fps step and policy inference: 6993 fps total: 6039 epoch: 424/1500\n",
            "saving next best rewards:  [30.730392]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8842 fps step and policy inference: 7184 fps total: 6183 epoch: 425/1500\n",
            "fps step: 7469 fps step and policy inference: 5872 fps total: 5186 epoch: 426/1500\n",
            "fps step: 8739 fps step and policy inference: 7049 fps total: 6082 epoch: 427/1500\n",
            "saving next best rewards:  [32.12111]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7933 fps step and policy inference: 6299 fps total: 5515 epoch: 428/1500\n",
            "saving next best rewards:  [32.28975]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8548 fps step and policy inference: 6777 fps total: 5839 epoch: 429/1500\n",
            "fps step: 8861 fps step and policy inference: 7081 fps total: 6107 epoch: 430/1500\n",
            "fps step: 8544 fps step and policy inference: 6917 fps total: 5986 epoch: 431/1500\n",
            "fps step: 8453 fps step and policy inference: 6795 fps total: 5891 epoch: 432/1500\n",
            "fps step: 7787 fps step and policy inference: 6123 fps total: 5369 epoch: 433/1500\n",
            "fps step: 7415 fps step and policy inference: 5856 fps total: 5173 epoch: 434/1500\n",
            "saving next best rewards:  [35.929085]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7571 fps step and policy inference: 5917 fps total: 5219 epoch: 435/1500\n",
            "fps step: 7460 fps step and policy inference: 5933 fps total: 5234 epoch: 436/1500\n",
            "fps step: 9446 fps step and policy inference: 7614 fps total: 6501 epoch: 437/1500\n",
            "fps step: 7470 fps step and policy inference: 5971 fps total: 5259 epoch: 438/1500\n",
            "fps step: 9480 fps step and policy inference: 7633 fps total: 6515 epoch: 439/1500\n",
            "fps step: 8468 fps step and policy inference: 6788 fps total: 5864 epoch: 440/1500\n",
            "fps step: 7449 fps step and policy inference: 5916 fps total: 5222 epoch: 441/1500\n",
            "fps step: 7689 fps step and policy inference: 6213 fps total: 5450 epoch: 442/1500\n",
            "fps step: 8857 fps step and policy inference: 7200 fps total: 6198 epoch: 443/1500\n",
            "fps step: 7807 fps step and policy inference: 6264 fps total: 5489 epoch: 444/1500\n",
            "fps step: 8853 fps step and policy inference: 7157 fps total: 6164 epoch: 445/1500\n",
            "fps step: 8279 fps step and policy inference: 6592 fps total: 5738 epoch: 446/1500\n",
            "fps step: 7140 fps step and policy inference: 5627 fps total: 4883 epoch: 447/1500\n",
            "fps step: 9511 fps step and policy inference: 7516 fps total: 6426 epoch: 448/1500\n",
            "fps step: 9568 fps step and policy inference: 7749 fps total: 6598 epoch: 449/1500\n",
            "fps step: 9386 fps step and policy inference: 7544 fps total: 6436 epoch: 450/1500\n",
            "fps step: 7994 fps step and policy inference: 6412 fps total: 5603 epoch: 451/1500\n",
            "fps step: 7461 fps step and policy inference: 6010 fps total: 5295 epoch: 452/1500\n",
            "fps step: 9280 fps step and policy inference: 7533 fps total: 6441 epoch: 453/1500\n",
            "fps step: 8339 fps step and policy inference: 6651 fps total: 5784 epoch: 454/1500\n",
            "fps step: 8359 fps step and policy inference: 6751 fps total: 5851 epoch: 455/1500\n",
            "fps step: 8664 fps step and policy inference: 7048 fps total: 6083 epoch: 456/1500\n",
            "fps step: 8867 fps step and policy inference: 7109 fps total: 6130 epoch: 457/1500\n",
            "fps step: 8286 fps step and policy inference: 6657 fps total: 5788 epoch: 458/1500\n",
            "saving next best rewards:  [37.00623]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8299 fps step and policy inference: 6691 fps total: 5798 epoch: 459/1500\n",
            "saving next best rewards:  [38.876015]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8861 fps step and policy inference: 7211 fps total: 6203 epoch: 460/1500\n",
            "fps step: 8246 fps step and policy inference: 6563 fps total: 5719 epoch: 461/1500\n",
            "fps step: 9647 fps step and policy inference: 7708 fps total: 6569 epoch: 462/1500\n",
            "fps step: 9075 fps step and policy inference: 7264 fps total: 6241 epoch: 463/1500\n",
            "fps step: 8117 fps step and policy inference: 6615 fps total: 5756 epoch: 464/1500\n",
            "fps step: 9350 fps step and policy inference: 7510 fps total: 6423 epoch: 465/1500\n",
            "fps step: 7249 fps step and policy inference: 5886 fps total: 5198 epoch: 466/1500\n",
            "fps step: 8657 fps step and policy inference: 7042 fps total: 6080 epoch: 467/1500\n",
            "fps step: 7956 fps step and policy inference: 6513 fps total: 5684 epoch: 468/1500\n",
            "fps step: 9139 fps step and policy inference: 7305 fps total: 6273 epoch: 469/1500\n",
            "fps step: 8697 fps step and policy inference: 7126 fps total: 6145 epoch: 470/1500\n",
            "fps step: 8709 fps step and policy inference: 6998 fps total: 6031 epoch: 471/1500\n",
            "fps step: 7910 fps step and policy inference: 6275 fps total: 5498 epoch: 472/1500\n",
            "fps step: 8376 fps step and policy inference: 6804 fps total: 5899 epoch: 473/1500\n",
            "saving next best rewards:  [39.874485]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8244 fps step and policy inference: 6563 fps total: 5718 epoch: 474/1500\n",
            "fps step: 8751 fps step and policy inference: 7001 fps total: 6050 epoch: 475/1500\n",
            "fps step: 7518 fps step and policy inference: 6004 fps total: 5289 epoch: 476/1500\n",
            "fps step: 8750 fps step and policy inference: 6933 fps total: 6002 epoch: 477/1500\n",
            "fps step: 9240 fps step and policy inference: 7516 fps total: 6432 epoch: 478/1500\n",
            "fps step: 8842 fps step and policy inference: 7185 fps total: 6170 epoch: 479/1500\n",
            "fps step: 7882 fps step and policy inference: 6296 fps total: 5515 epoch: 480/1500\n",
            "fps step: 9194 fps step and policy inference: 7516 fps total: 6429 epoch: 481/1500\n",
            "saving next best rewards:  [40.514366]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8459 fps step and policy inference: 6704 fps total: 5828 epoch: 482/1500\n",
            "fps step: 8991 fps step and policy inference: 7160 fps total: 6164 epoch: 483/1500\n",
            "fps step: 9252 fps step and policy inference: 7545 fps total: 6445 epoch: 484/1500\n",
            "saving next best rewards:  [44.334324]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7908 fps step and policy inference: 6186 fps total: 5427 epoch: 485/1500\n",
            "fps step: 9034 fps step and policy inference: 7233 fps total: 6205 epoch: 486/1500\n",
            "saving next best rewards:  [48.218758]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 7958 fps step and policy inference: 6290 fps total: 5506 epoch: 487/1500\n",
            "saving next best rewards:  [54.320667]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8048 fps step and policy inference: 6426 fps total: 5614 epoch: 488/1500\n",
            "fps step: 8453 fps step and policy inference: 6715 fps total: 5832 epoch: 489/1500\n",
            "fps step: 8858 fps step and policy inference: 7050 fps total: 6088 epoch: 490/1500\n",
            "fps step: 8182 fps step and policy inference: 6597 fps total: 5743 epoch: 491/1500\n",
            "fps step: 8065 fps step and policy inference: 6427 fps total: 5614 epoch: 492/1500\n",
            "fps step: 8237 fps step and policy inference: 6641 fps total: 5780 epoch: 493/1500\n",
            "fps step: 8279 fps step and policy inference: 6636 fps total: 5774 epoch: 494/1500\n",
            "fps step: 7772 fps step and policy inference: 6076 fps total: 5343 epoch: 495/1500\n",
            "fps step: 9724 fps step and policy inference: 7753 fps total: 6574 epoch: 496/1500\n",
            "fps step: 8277 fps step and policy inference: 6640 fps total: 5766 epoch: 497/1500\n",
            "fps step: 7567 fps step and policy inference: 5980 fps total: 5270 epoch: 498/1500\n",
            "fps step: 8572 fps step and policy inference: 6832 fps total: 5922 epoch: 499/1500\n",
            "fps step: 8403 fps step and policy inference: 6699 fps total: 5830 epoch: 500/1500\n",
            "fps step: 9213 fps step and policy inference: 7582 fps total: 6478 epoch: 501/1500\n",
            "fps step: 8189 fps step and policy inference: 6607 fps total: 5750 epoch: 502/1500\n",
            "fps step: 8497 fps step and policy inference: 6796 fps total: 5892 epoch: 503/1500\n",
            "fps step: 7445 fps step and policy inference: 6016 fps total: 5305 epoch: 504/1500\n",
            "fps step: 9246 fps step and policy inference: 7447 fps total: 6386 epoch: 505/1500\n",
            "fps step: 8419 fps step and policy inference: 6670 fps total: 5799 epoch: 506/1500\n",
            "fps step: 8943 fps step and policy inference: 7169 fps total: 6179 epoch: 507/1500\n",
            "fps step: 8724 fps step and policy inference: 6959 fps total: 6001 epoch: 508/1500\n",
            "fps step: 8592 fps step and policy inference: 6922 fps total: 5989 epoch: 509/1500\n",
            "fps step: 9197 fps step and policy inference: 7424 fps total: 6361 epoch: 510/1500\n",
            "fps step: 8259 fps step and policy inference: 6628 fps total: 5753 epoch: 511/1500\n",
            "fps step: 8020 fps step and policy inference: 6435 fps total: 5621 epoch: 512/1500\n",
            "fps step: 8032 fps step and policy inference: 6347 fps total: 5552 epoch: 513/1500\n",
            "fps step: 9426 fps step and policy inference: 7514 fps total: 6428 epoch: 514/1500\n",
            "fps step: 7895 fps step and policy inference: 6314 fps total: 5528 epoch: 515/1500\n",
            "fps step: 9298 fps step and policy inference: 7576 fps total: 6456 epoch: 516/1500\n",
            "fps step: 9499 fps step and policy inference: 7572 fps total: 6469 epoch: 517/1500\n",
            "fps step: 8172 fps step and policy inference: 6528 fps total: 5691 epoch: 518/1500\n",
            "fps step: 7840 fps step and policy inference: 6241 fps total: 5455 epoch: 519/1500\n",
            "fps step: 7691 fps step and policy inference: 6041 fps total: 5318 epoch: 520/1500\n",
            "fps step: 8040 fps step and policy inference: 6397 fps total: 5590 epoch: 521/1500\n",
            "fps step: 7838 fps step and policy inference: 6289 fps total: 5510 epoch: 522/1500\n",
            "fps step: 7513 fps step and policy inference: 5989 fps total: 5276 epoch: 523/1500\n",
            "fps step: 8649 fps step and policy inference: 6933 fps total: 5998 epoch: 524/1500\n",
            "fps step: 9073 fps step and policy inference: 7275 fps total: 6263 epoch: 525/1500\n",
            "fps step: 8183 fps step and policy inference: 6593 fps total: 5739 epoch: 526/1500\n",
            "fps step: 9781 fps step and policy inference: 7803 fps total: 6646 epoch: 527/1500\n",
            "fps step: 7417 fps step and policy inference: 5827 fps total: 5155 epoch: 528/1500\n",
            "fps step: 7926 fps step and policy inference: 6295 fps total: 5510 epoch: 529/1500\n",
            "fps step: 8687 fps step and policy inference: 6933 fps total: 5997 epoch: 530/1500\n",
            "fps step: 7692 fps step and policy inference: 6148 fps total: 5401 epoch: 531/1500\n",
            "fps step: 7884 fps step and policy inference: 6332 fps total: 5547 epoch: 532/1500\n",
            "fps step: 8530 fps step and policy inference: 7029 fps total: 6062 epoch: 533/1500\n",
            "fps step: 9057 fps step and policy inference: 7429 fps total: 6365 epoch: 534/1500\n",
            "fps step: 9249 fps step and policy inference: 7374 fps total: 6324 epoch: 535/1500\n",
            "fps step: 8680 fps step and policy inference: 6893 fps total: 5965 epoch: 536/1500\n",
            "fps step: 8265 fps step and policy inference: 6613 fps total: 5766 epoch: 537/1500\n",
            "fps step: 8827 fps step and policy inference: 6919 fps total: 5982 epoch: 538/1500\n",
            "fps step: 7534 fps step and policy inference: 5865 fps total: 5179 epoch: 539/1500\n",
            "fps step: 8149 fps step and policy inference: 6613 fps total: 5760 epoch: 540/1500\n",
            "fps step: 9224 fps step and policy inference: 7264 fps total: 6224 epoch: 541/1500\n",
            "fps step: 9363 fps step and policy inference: 7524 fps total: 6432 epoch: 542/1500\n",
            "fps step: 8115 fps step and policy inference: 6504 fps total: 5658 epoch: 543/1500\n",
            "saving next best rewards:  [55.079437]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8935 fps step and policy inference: 7212 fps total: 6186 epoch: 544/1500\n",
            "saving next best rewards:  [55.281284]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8638 fps step and policy inference: 6857 fps total: 5939 epoch: 545/1500\n",
            "saving next best rewards:  [59.68618]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8067 fps step and policy inference: 6619 fps total: 5760 epoch: 546/1500\n",
            "fps step: 7521 fps step and policy inference: 6007 fps total: 5272 epoch: 547/1500\n",
            "fps step: 8939 fps step and policy inference: 7307 fps total: 6279 epoch: 548/1500\n",
            "fps step: 8468 fps step and policy inference: 6772 fps total: 5868 epoch: 549/1500\n",
            "fps step: 8623 fps step and policy inference: 6990 fps total: 6044 epoch: 550/1500\n",
            "fps step: 8662 fps step and policy inference: 7046 fps total: 6093 epoch: 551/1500\n",
            "fps step: 9038 fps step and policy inference: 7275 fps total: 6240 epoch: 552/1500\n",
            "fps step: 8844 fps step and policy inference: 7114 fps total: 6132 epoch: 553/1500\n",
            "fps step: 7672 fps step and policy inference: 6129 fps total: 5388 epoch: 554/1500\n",
            "fps step: 8864 fps step and policy inference: 7130 fps total: 6157 epoch: 555/1500\n",
            "fps step: 8733 fps step and policy inference: 6989 fps total: 6021 epoch: 556/1500\n",
            "fps step: 7664 fps step and policy inference: 6135 fps total: 5381 epoch: 557/1500\n",
            "fps step: 8381 fps step and policy inference: 6589 fps total: 5724 epoch: 558/1500\n",
            "fps step: 9978 fps step and policy inference: 7789 fps total: 6628 epoch: 559/1500\n",
            "fps step: 8910 fps step and policy inference: 7188 fps total: 6170 epoch: 560/1500\n",
            "fps step: 7010 fps step and policy inference: 5707 fps total: 5057 epoch: 561/1500\n",
            "fps step: 7614 fps step and policy inference: 6058 fps total: 5319 epoch: 562/1500\n",
            "fps step: 9817 fps step and policy inference: 7903 fps total: 6711 epoch: 563/1500\n",
            "fps step: 9628 fps step and policy inference: 7690 fps total: 6562 epoch: 564/1500\n",
            "fps step: 8814 fps step and policy inference: 6940 fps total: 5997 epoch: 565/1500\n",
            "fps step: 8477 fps step and policy inference: 6759 fps total: 5866 epoch: 566/1500\n",
            "fps step: 9032 fps step and policy inference: 7283 fps total: 6255 epoch: 567/1500\n",
            "fps step: 8766 fps step and policy inference: 7061 fps total: 6093 epoch: 568/1500\n",
            "fps step: 7527 fps step and policy inference: 6153 fps total: 5393 epoch: 569/1500\n",
            "fps step: 8420 fps step and policy inference: 6790 fps total: 5885 epoch: 570/1500\n",
            "fps step: 9162 fps step and policy inference: 7441 fps total: 6356 epoch: 571/1500\n",
            "fps step: 7687 fps step and policy inference: 6072 fps total: 5335 epoch: 572/1500\n",
            "fps step: 8524 fps step and policy inference: 6854 fps total: 5940 epoch: 573/1500\n",
            "fps step: 7455 fps step and policy inference: 5961 fps total: 5253 epoch: 574/1500\n",
            "saving next best rewards:  [64.38379]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8273 fps step and policy inference: 6525 fps total: 5694 epoch: 575/1500\n",
            "fps step: 9419 fps step and policy inference: 7625 fps total: 6507 epoch: 576/1500\n",
            "fps step: 7718 fps step and policy inference: 6303 fps total: 5519 epoch: 577/1500\n",
            "fps step: 9063 fps step and policy inference: 7238 fps total: 6236 epoch: 578/1500\n",
            "fps step: 8574 fps step and policy inference: 6858 fps total: 5926 epoch: 579/1500\n",
            "fps step: 9496 fps step and policy inference: 7551 fps total: 6454 epoch: 580/1500\n",
            "fps step: 9048 fps step and policy inference: 7217 fps total: 6200 epoch: 581/1500\n",
            "fps step: 9615 fps step and policy inference: 7694 fps total: 6559 epoch: 582/1500\n",
            "fps step: 8096 fps step and policy inference: 6525 fps total: 5689 epoch: 583/1500\n",
            "fps step: 8706 fps step and policy inference: 7006 fps total: 6060 epoch: 584/1500\n",
            "fps step: 8321 fps step and policy inference: 6704 fps total: 5807 epoch: 585/1500\n",
            "fps step: 9662 fps step and policy inference: 7866 fps total: 6683 epoch: 586/1500\n",
            "fps step: 8413 fps step and policy inference: 6887 fps total: 5967 epoch: 587/1500\n",
            "fps step: 9504 fps step and policy inference: 7556 fps total: 6458 epoch: 588/1500\n",
            "fps step: 9380 fps step and policy inference: 7582 fps total: 6477 epoch: 589/1500\n",
            "fps step: 8621 fps step and policy inference: 7021 fps total: 6063 epoch: 590/1500\n",
            "fps step: 8110 fps step and policy inference: 6694 fps total: 5816 epoch: 591/1500\n",
            "fps step: 9030 fps step and policy inference: 7198 fps total: 6195 epoch: 592/1500\n",
            "fps step: 9140 fps step and policy inference: 7420 fps total: 6357 epoch: 593/1500\n",
            "fps step: 9243 fps step and policy inference: 7465 fps total: 6390 epoch: 594/1500\n",
            "fps step: 8410 fps step and policy inference: 6738 fps total: 5822 epoch: 595/1500\n",
            "fps step: 9232 fps step and policy inference: 7404 fps total: 6350 epoch: 596/1500\n",
            "fps step: 9501 fps step and policy inference: 7690 fps total: 6557 epoch: 597/1500\n",
            "fps step: 7565 fps step and policy inference: 6069 fps total: 5307 epoch: 598/1500\n",
            "fps step: 8532 fps step and policy inference: 6876 fps total: 5954 epoch: 599/1500\n",
            "fps step: 7578 fps step and policy inference: 5972 fps total: 5267 epoch: 600/1500\n",
            "fps step: 9419 fps step and policy inference: 7525 fps total: 6435 epoch: 601/1500\n",
            "fps step: 9781 fps step and policy inference: 7877 fps total: 6669 epoch: 602/1500\n",
            "fps step: 10391 fps step and policy inference: 8312 fps total: 7001 epoch: 603/1500\n",
            "fps step: 8495 fps step and policy inference: 6757 fps total: 5864 epoch: 604/1500\n",
            "saving next best rewards:  [71.89007]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8581 fps step and policy inference: 6911 fps total: 5960 epoch: 605/1500\n",
            "fps step: 7514 fps step and policy inference: 5863 fps total: 5178 epoch: 606/1500\n",
            "fps step: 9110 fps step and policy inference: 7366 fps total: 6318 epoch: 607/1500\n",
            "fps step: 8648 fps step and policy inference: 6973 fps total: 6028 epoch: 608/1500\n",
            "fps step: 9223 fps step and policy inference: 7534 fps total: 6442 epoch: 609/1500\n",
            "fps step: 9446 fps step and policy inference: 7416 fps total: 6356 epoch: 610/1500\n",
            "fps step: 8702 fps step and policy inference: 6802 fps total: 5897 epoch: 611/1500\n",
            "fps step: 8484 fps step and policy inference: 6747 fps total: 5859 epoch: 612/1500\n",
            "fps step: 8425 fps step and policy inference: 6663 fps total: 5794 epoch: 613/1500\n",
            "fps step: 8589 fps step and policy inference: 6851 fps total: 5936 epoch: 614/1500\n",
            "fps step: 9111 fps step and policy inference: 7249 fps total: 6231 epoch: 615/1500\n",
            "fps step: 7837 fps step and policy inference: 6306 fps total: 5522 epoch: 616/1500\n",
            "fps step: 8963 fps step and policy inference: 7066 fps total: 6067 epoch: 617/1500\n",
            "fps step: 8741 fps step and policy inference: 6911 fps total: 5959 epoch: 618/1500\n",
            "fps step: 9315 fps step and policy inference: 7417 fps total: 6340 epoch: 619/1500\n",
            "fps step: 8873 fps step and policy inference: 7192 fps total: 6186 epoch: 620/1500\n",
            "fps step: 8877 fps step and policy inference: 7066 fps total: 6104 epoch: 621/1500\n",
            "fps step: 8612 fps step and policy inference: 6942 fps total: 6002 epoch: 622/1500\n",
            "fps step: 9717 fps step and policy inference: 7966 fps total: 6758 epoch: 623/1500\n",
            "fps step: 7870 fps step and policy inference: 6324 fps total: 5537 epoch: 624/1500\n",
            "fps step: 7166 fps step and policy inference: 5640 fps total: 5004 epoch: 625/1500\n",
            "fps step: 8713 fps step and policy inference: 7056 fps total: 6085 epoch: 626/1500\n",
            "fps step: 9435 fps step and policy inference: 7492 fps total: 6414 epoch: 627/1500\n",
            "fps step: 8265 fps step and policy inference: 6505 fps total: 5678 epoch: 628/1500\n",
            "fps step: 7673 fps step and policy inference: 6075 fps total: 5343 epoch: 629/1500\n",
            "fps step: 7991 fps step and policy inference: 6344 fps total: 5551 epoch: 630/1500\n",
            "fps step: 9066 fps step and policy inference: 7276 fps total: 6251 epoch: 631/1500\n",
            "fps step: 8372 fps step and policy inference: 6670 fps total: 5802 epoch: 632/1500\n",
            "fps step: 9506 fps step and policy inference: 7510 fps total: 6415 epoch: 633/1500\n",
            "fps step: 9661 fps step and policy inference: 7738 fps total: 6590 epoch: 634/1500\n",
            "fps step: 8498 fps step and policy inference: 6757 fps total: 5866 epoch: 635/1500\n",
            "fps step: 8188 fps step and policy inference: 6634 fps total: 5773 epoch: 636/1500\n",
            "fps step: 9468 fps step and policy inference: 7570 fps total: 6475 epoch: 637/1500\n",
            "fps step: 8921 fps step and policy inference: 7173 fps total: 6177 epoch: 638/1500\n",
            "fps step: 8945 fps step and policy inference: 7201 fps total: 6197 epoch: 639/1500\n",
            "fps step: 8899 fps step and policy inference: 7145 fps total: 6131 epoch: 640/1500\n",
            "fps step: 9375 fps step and policy inference: 7422 fps total: 6356 epoch: 641/1500\n",
            "fps step: 7011 fps step and policy inference: 5510 fps total: 4882 epoch: 642/1500\n",
            "fps step: 9032 fps step and policy inference: 7214 fps total: 6197 epoch: 643/1500\n",
            "fps step: 9488 fps step and policy inference: 7678 fps total: 6546 epoch: 644/1500\n",
            "fps step: 8668 fps step and policy inference: 6913 fps total: 5987 epoch: 645/1500\n",
            "fps step: 9185 fps step and policy inference: 7436 fps total: 6370 epoch: 646/1500\n",
            "fps step: 7887 fps step and policy inference: 6353 fps total: 5553 epoch: 647/1500\n",
            "fps step: 9760 fps step and policy inference: 7786 fps total: 6629 epoch: 648/1500\n",
            "fps step: 8064 fps step and policy inference: 6441 fps total: 5625 epoch: 649/1500\n",
            "fps step: 8362 fps step and policy inference: 6577 fps total: 5730 epoch: 650/1500\n",
            "fps step: 8477 fps step and policy inference: 6642 fps total: 5778 epoch: 651/1500\n",
            "fps step: 8797 fps step and policy inference: 7216 fps total: 6207 epoch: 652/1500\n",
            "fps step: 7860 fps step and policy inference: 6292 fps total: 5514 epoch: 653/1500\n",
            "fps step: 9091 fps step and policy inference: 7197 fps total: 6204 epoch: 654/1500\n",
            "fps step: 8999 fps step and policy inference: 7271 fps total: 6246 epoch: 655/1500\n",
            "fps step: 8943 fps step and policy inference: 7291 fps total: 6241 epoch: 656/1500\n",
            "fps step: 9433 fps step and policy inference: 7435 fps total: 6370 epoch: 657/1500\n",
            "fps step: 9315 fps step and policy inference: 7477 fps total: 6400 epoch: 658/1500\n",
            "fps step: 8077 fps step and policy inference: 6472 fps total: 5649 epoch: 659/1500\n",
            "fps step: 8154 fps step and policy inference: 6483 fps total: 5642 epoch: 660/1500\n",
            "fps step: 9816 fps step and policy inference: 7940 fps total: 6734 epoch: 661/1500\n",
            "fps step: 8360 fps step and policy inference: 6594 fps total: 5735 epoch: 662/1500\n",
            "fps step: 8366 fps step and policy inference: 6673 fps total: 5805 epoch: 663/1500\n",
            "fps step: 9845 fps step and policy inference: 7845 fps total: 6667 epoch: 664/1500\n",
            "fps step: 9456 fps step and policy inference: 7577 fps total: 6475 epoch: 665/1500\n",
            "fps step: 9954 fps step and policy inference: 7991 fps total: 6772 epoch: 666/1500\n",
            "fps step: 8594 fps step and policy inference: 6876 fps total: 5964 epoch: 667/1500\n",
            "fps step: 9736 fps step and policy inference: 7911 fps total: 6719 epoch: 668/1500\n",
            "fps step: 8541 fps step and policy inference: 7033 fps total: 6056 epoch: 669/1500\n",
            "fps step: 8396 fps step and policy inference: 6751 fps total: 5856 epoch: 670/1500\n",
            "fps step: 8605 fps step and policy inference: 6883 fps total: 5959 epoch: 671/1500\n",
            "fps step: 8839 fps step and policy inference: 7090 fps total: 6114 epoch: 672/1500\n",
            "fps step: 8511 fps step and policy inference: 6723 fps total: 5839 epoch: 673/1500\n",
            "fps step: 8033 fps step and policy inference: 6450 fps total: 5630 epoch: 674/1500\n",
            "fps step: 10442 fps step and policy inference: 8376 fps total: 7047 epoch: 675/1500\n",
            "saving next best rewards:  [76.11868]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8875 fps step and policy inference: 6979 fps total: 6031 epoch: 676/1500\n",
            "fps step: 9246 fps step and policy inference: 7357 fps total: 6306 epoch: 677/1500\n",
            "fps step: 7980 fps step and policy inference: 6327 fps total: 5538 epoch: 678/1500\n",
            "fps step: 8674 fps step and policy inference: 6918 fps total: 5987 epoch: 679/1500\n",
            "fps step: 8968 fps step and policy inference: 7238 fps total: 6215 epoch: 680/1500\n",
            "fps step: 9565 fps step and policy inference: 7758 fps total: 6606 epoch: 681/1500\n",
            "fps step: 8555 fps step and policy inference: 6743 fps total: 5846 epoch: 682/1500\n",
            "fps step: 9919 fps step and policy inference: 7868 fps total: 6686 epoch: 683/1500\n",
            "fps step: 8820 fps step and policy inference: 7051 fps total: 6077 epoch: 684/1500\n",
            "fps step: 7856 fps step and policy inference: 6265 fps total: 5492 epoch: 685/1500\n",
            "fps step: 9279 fps step and policy inference: 7479 fps total: 6400 epoch: 686/1500\n",
            "fps step: 8129 fps step and policy inference: 6483 fps total: 5641 epoch: 687/1500\n",
            "saving next best rewards:  [78.45671]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8163 fps step and policy inference: 6368 fps total: 5567 epoch: 688/1500\n",
            "fps step: 7332 fps step and policy inference: 5722 fps total: 5068 epoch: 689/1500\n",
            "fps step: 9526 fps step and policy inference: 7623 fps total: 6506 epoch: 690/1500\n",
            "fps step: 7970 fps step and policy inference: 6258 fps total: 5485 epoch: 691/1500\n",
            "fps step: 9495 fps step and policy inference: 7672 fps total: 6533 epoch: 692/1500\n",
            "fps step: 7069 fps step and policy inference: 5690 fps total: 5038 epoch: 693/1500\n",
            "fps step: 7589 fps step and policy inference: 6062 fps total: 5334 epoch: 694/1500\n",
            "fps step: 8184 fps step and policy inference: 6406 fps total: 5596 epoch: 695/1500\n",
            "fps step: 10120 fps step and policy inference: 8132 fps total: 6876 epoch: 696/1500\n",
            "fps step: 8413 fps step and policy inference: 6603 fps total: 5747 epoch: 697/1500\n",
            "fps step: 9498 fps step and policy inference: 7667 fps total: 6538 epoch: 698/1500\n",
            "fps step: 10031 fps step and policy inference: 8101 fps total: 6852 epoch: 699/1500\n",
            "fps step: 9157 fps step and policy inference: 7204 fps total: 6203 epoch: 700/1500\n",
            "fps step: 9689 fps step and policy inference: 7819 fps total: 6654 epoch: 701/1500\n",
            "saving next best rewards:  [80.01203]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9019 fps step and policy inference: 7063 fps total: 6091 epoch: 702/1500\n",
            "fps step: 9868 fps step and policy inference: 7952 fps total: 6745 epoch: 703/1500\n",
            "saving next best rewards:  [81.964355]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8962 fps step and policy inference: 7158 fps total: 6163 epoch: 704/1500\n",
            "fps step: 7809 fps step and policy inference: 6276 fps total: 5497 epoch: 705/1500\n",
            "fps step: 7155 fps step and policy inference: 5504 fps total: 4895 epoch: 706/1500\n",
            "fps step: 9776 fps step and policy inference: 7961 fps total: 6752 epoch: 707/1500\n",
            "fps step: 10044 fps step and policy inference: 8108 fps total: 6855 epoch: 708/1500\n",
            "fps step: 8895 fps step and policy inference: 7153 fps total: 6160 epoch: 709/1500\n",
            "fps step: 8444 fps step and policy inference: 6672 fps total: 5775 epoch: 710/1500\n",
            "fps step: 10145 fps step and policy inference: 8075 fps total: 6820 epoch: 711/1500\n",
            "fps step: 9060 fps step and policy inference: 7282 fps total: 6256 epoch: 712/1500\n",
            "fps step: 9621 fps step and policy inference: 7641 fps total: 6506 epoch: 713/1500\n",
            "fps step: 9219 fps step and policy inference: 7168 fps total: 6171 epoch: 714/1500\n",
            "fps step: 9157 fps step and policy inference: 7317 fps total: 6278 epoch: 715/1500\n",
            "fps step: 9256 fps step and policy inference: 7416 fps total: 6355 epoch: 716/1500\n",
            "fps step: 9598 fps step and policy inference: 7762 fps total: 6608 epoch: 717/1500\n",
            "fps step: 8847 fps step and policy inference: 7063 fps total: 6097 epoch: 718/1500\n",
            "fps step: 9888 fps step and policy inference: 7959 fps total: 6750 epoch: 719/1500\n",
            "saving next best rewards:  [82.52823]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8989 fps step and policy inference: 6921 fps total: 5987 epoch: 720/1500\n",
            "saving next best rewards:  [91.756035]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8317 fps step and policy inference: 6752 fps total: 5843 epoch: 721/1500\n",
            "fps step: 9268 fps step and policy inference: 7534 fps total: 6441 epoch: 722/1500\n",
            "fps step: 8788 fps step and policy inference: 7108 fps total: 6127 epoch: 723/1500\n",
            "fps step: 9137 fps step and policy inference: 7259 fps total: 6240 epoch: 724/1500\n",
            "fps step: 9005 fps step and policy inference: 7345 fps total: 6291 epoch: 725/1500\n",
            "fps step: 9774 fps step and policy inference: 7681 fps total: 6549 epoch: 726/1500\n",
            "fps step: 8615 fps step and policy inference: 6899 fps total: 5950 epoch: 727/1500\n",
            "fps step: 7712 fps step and policy inference: 6094 fps total: 5360 epoch: 728/1500\n",
            "fps step: 8363 fps step and policy inference: 6669 fps total: 5803 epoch: 729/1500\n",
            "fps step: 8740 fps step and policy inference: 6934 fps total: 5996 epoch: 730/1500\n",
            "fps step: 8638 fps step and policy inference: 6834 fps total: 5923 epoch: 731/1500\n",
            "fps step: 8140 fps step and policy inference: 6446 fps total: 5629 epoch: 732/1500\n",
            "fps step: 8972 fps step and policy inference: 7074 fps total: 6068 epoch: 733/1500\n",
            "fps step: 9504 fps step and policy inference: 7578 fps total: 6474 epoch: 734/1500\n",
            "fps step: 9474 fps step and policy inference: 7615 fps total: 6501 epoch: 735/1500\n",
            "fps step: 8663 fps step and policy inference: 6930 fps total: 5997 epoch: 736/1500\n",
            "fps step: 9206 fps step and policy inference: 7469 fps total: 6393 epoch: 737/1500\n",
            "fps step: 8926 fps step and policy inference: 7136 fps total: 6149 epoch: 738/1500\n",
            "fps step: 8462 fps step and policy inference: 6710 fps total: 5830 epoch: 739/1500\n",
            "fps step: 8597 fps step and policy inference: 6901 fps total: 5974 epoch: 740/1500\n",
            "fps step: 9923 fps step and policy inference: 7944 fps total: 6740 epoch: 741/1500\n",
            "fps step: 10468 fps step and policy inference: 8361 fps total: 7036 epoch: 742/1500\n",
            "fps step: 9497 fps step and policy inference: 7557 fps total: 6440 epoch: 743/1500\n",
            "fps step: 9924 fps step and policy inference: 7831 fps total: 6651 epoch: 744/1500\n",
            "fps step: 8569 fps step and policy inference: 6817 fps total: 5906 epoch: 745/1500\n",
            "fps step: 7559 fps step and policy inference: 5877 fps total: 5191 epoch: 746/1500\n",
            "fps step: 9606 fps step and policy inference: 7576 fps total: 6480 epoch: 747/1500\n",
            "fps step: 10050 fps step and policy inference: 7850 fps total: 6665 epoch: 748/1500\n",
            "fps step: 8416 fps step and policy inference: 6896 fps total: 5963 epoch: 749/1500\n",
            "fps step: 8620 fps step and policy inference: 6831 fps total: 5913 epoch: 750/1500\n",
            "fps step: 9506 fps step and policy inference: 7563 fps total: 6462 epoch: 751/1500\n",
            "fps step: 8062 fps step and policy inference: 6463 fps total: 5645 epoch: 752/1500\n",
            "fps step: 9264 fps step and policy inference: 7428 fps total: 6365 epoch: 753/1500\n",
            "fps step: 9859 fps step and policy inference: 7910 fps total: 6722 epoch: 754/1500\n",
            "fps step: 9141 fps step and policy inference: 7316 fps total: 6284 epoch: 755/1500\n",
            "fps step: 9794 fps step and policy inference: 7758 fps total: 6605 epoch: 756/1500\n",
            "fps step: 7835 fps step and policy inference: 6260 fps total: 5495 epoch: 757/1500\n",
            "fps step: 8180 fps step and policy inference: 6551 fps total: 5712 epoch: 758/1500\n",
            "fps step: 9355 fps step and policy inference: 7536 fps total: 6442 epoch: 759/1500\n",
            "fps step: 9595 fps step and policy inference: 7608 fps total: 6489 epoch: 760/1500\n",
            "fps step: 8631 fps step and policy inference: 6891 fps total: 5951 epoch: 761/1500\n",
            "fps step: 8862 fps step and policy inference: 7018 fps total: 6060 epoch: 762/1500\n",
            "fps step: 8122 fps step and policy inference: 6370 fps total: 5574 epoch: 763/1500\n",
            "fps step: 9466 fps step and policy inference: 7599 fps total: 6489 epoch: 764/1500\n",
            "fps step: 8462 fps step and policy inference: 6618 fps total: 5766 epoch: 765/1500\n",
            "fps step: 7340 fps step and policy inference: 5634 fps total: 4997 epoch: 766/1500\n",
            "fps step: 9320 fps step and policy inference: 7375 fps total: 6323 epoch: 767/1500\n",
            "fps step: 9522 fps step and policy inference: 7736 fps total: 6591 epoch: 768/1500\n",
            "fps step: 8768 fps step and policy inference: 6950 fps total: 6021 epoch: 769/1500\n",
            "fps step: 9522 fps step and policy inference: 7569 fps total: 6466 epoch: 770/1500\n",
            "fps step: 9204 fps step and policy inference: 7242 fps total: 6215 epoch: 771/1500\n",
            "fps step: 8819 fps step and policy inference: 7091 fps total: 6113 epoch: 772/1500\n",
            "fps step: 10970 fps step and policy inference: 8753 fps total: 7312 epoch: 773/1500\n",
            "fps step: 9941 fps step and policy inference: 8000 fps total: 6780 epoch: 774/1500\n",
            "fps step: 8922 fps step and policy inference: 7115 fps total: 6129 epoch: 775/1500\n",
            "fps step: 8590 fps step and policy inference: 6827 fps total: 5916 epoch: 776/1500\n",
            "fps step: 9214 fps step and policy inference: 7269 fps total: 6223 epoch: 777/1500\n",
            "fps step: 9427 fps step and policy inference: 7508 fps total: 6427 epoch: 778/1500\n",
            "fps step: 8574 fps step and policy inference: 6912 fps total: 5984 epoch: 779/1500\n",
            "fps step: 10033 fps step and policy inference: 8013 fps total: 6789 epoch: 780/1500\n",
            "fps step: 9242 fps step and policy inference: 7494 fps total: 6413 epoch: 781/1500\n",
            "fps step: 8334 fps step and policy inference: 6600 fps total: 5747 epoch: 782/1500\n",
            "fps step: 10185 fps step and policy inference: 8143 fps total: 6855 epoch: 783/1500\n",
            "fps step: 9767 fps step and policy inference: 7819 fps total: 6650 epoch: 784/1500\n",
            "fps step: 10132 fps step and policy inference: 8034 fps total: 6804 epoch: 785/1500\n",
            "fps step: 10114 fps step and policy inference: 8052 fps total: 6807 epoch: 786/1500\n",
            "fps step: 9106 fps step and policy inference: 7204 fps total: 6195 epoch: 787/1500\n",
            "fps step: 8841 fps step and policy inference: 6978 fps total: 6031 epoch: 788/1500\n",
            "fps step: 7982 fps step and policy inference: 6301 fps total: 5521 epoch: 789/1500\n",
            "fps step: 9088 fps step and policy inference: 7165 fps total: 6178 epoch: 790/1500\n",
            "fps step: 8812 fps step and policy inference: 7063 fps total: 6082 epoch: 791/1500\n",
            "fps step: 9068 fps step and policy inference: 7169 fps total: 6174 epoch: 792/1500\n",
            "fps step: 8958 fps step and policy inference: 7242 fps total: 6228 epoch: 793/1500\n",
            "fps step: 9176 fps step and policy inference: 7271 fps total: 6248 epoch: 794/1500\n",
            "fps step: 10025 fps step and policy inference: 8013 fps total: 6789 epoch: 795/1500\n",
            "fps step: 9692 fps step and policy inference: 7659 fps total: 6529 epoch: 796/1500\n",
            "fps step: 8618 fps step and policy inference: 6783 fps total: 5884 epoch: 797/1500\n",
            "fps step: 8676 fps step and policy inference: 6890 fps total: 5970 epoch: 798/1500\n",
            "fps step: 8802 fps step and policy inference: 6970 fps total: 6028 epoch: 799/1500\n",
            "fps step: 9480 fps step and policy inference: 7632 fps total: 6510 epoch: 800/1500\n",
            "fps step: 8361 fps step and policy inference: 6532 fps total: 5699 epoch: 801/1500\n",
            "fps step: 10353 fps step and policy inference: 8232 fps total: 6952 epoch: 802/1500\n",
            "fps step: 9254 fps step and policy inference: 7322 fps total: 6266 epoch: 803/1500\n",
            "fps step: 9839 fps step and policy inference: 7857 fps total: 6675 epoch: 804/1500\n",
            "fps step: 9514 fps step and policy inference: 7582 fps total: 6454 epoch: 805/1500\n",
            "fps step: 8123 fps step and policy inference: 6314 fps total: 5526 epoch: 806/1500\n",
            "fps step: 10719 fps step and policy inference: 8477 fps total: 7128 epoch: 807/1500\n",
            "fps step: 10095 fps step and policy inference: 8135 fps total: 6874 epoch: 808/1500\n",
            "fps step: 9042 fps step and policy inference: 7203 fps total: 6201 epoch: 809/1500\n",
            "fps step: 8732 fps step and policy inference: 7060 fps total: 6091 epoch: 810/1500\n",
            "fps step: 8336 fps step and policy inference: 6641 fps total: 5782 epoch: 811/1500\n",
            "fps step: 8655 fps step and policy inference: 6952 fps total: 6013 epoch: 812/1500\n",
            "fps step: 9706 fps step and policy inference: 7732 fps total: 6586 epoch: 813/1500\n",
            "fps step: 9768 fps step and policy inference: 7753 fps total: 6609 epoch: 814/1500\n",
            "fps step: 9828 fps step and policy inference: 7963 fps total: 6751 epoch: 815/1500\n",
            "fps step: 9226 fps step and policy inference: 7288 fps total: 6238 epoch: 816/1500\n",
            "fps step: 10355 fps step and policy inference: 8267 fps total: 6979 epoch: 817/1500\n",
            "fps step: 9513 fps step and policy inference: 7591 fps total: 6483 epoch: 818/1500\n",
            "fps step: 9776 fps step and policy inference: 7802 fps total: 6640 epoch: 819/1500\n",
            "fps step: 9075 fps step and policy inference: 7147 fps total: 6156 epoch: 820/1500\n",
            "fps step: 10824 fps step and policy inference: 8586 fps total: 7194 epoch: 821/1500\n",
            "fps step: 9203 fps step and policy inference: 7363 fps total: 6315 epoch: 822/1500\n",
            "fps step: 8988 fps step and policy inference: 6977 fps total: 6025 epoch: 823/1500\n",
            "fps step: 9607 fps step and policy inference: 7517 fps total: 6429 epoch: 824/1500\n",
            "fps step: 9716 fps step and policy inference: 7649 fps total: 6527 epoch: 825/1500\n",
            "fps step: 10036 fps step and policy inference: 7994 fps total: 6774 epoch: 826/1500\n",
            "fps step: 7920 fps step and policy inference: 6321 fps total: 5533 epoch: 827/1500\n",
            "fps step: 8693 fps step and policy inference: 6934 fps total: 5999 epoch: 828/1500\n",
            "fps step: 8589 fps step and policy inference: 6818 fps total: 5912 epoch: 829/1500\n",
            "fps step: 8079 fps step and policy inference: 6404 fps total: 5605 epoch: 830/1500\n",
            "fps step: 9011 fps step and policy inference: 7214 fps total: 6206 epoch: 831/1500\n",
            "fps step: 8482 fps step and policy inference: 6737 fps total: 5852 epoch: 832/1500\n",
            "fps step: 8894 fps step and policy inference: 6954 fps total: 6002 epoch: 833/1500\n",
            "fps step: 8273 fps step and policy inference: 6409 fps total: 5600 epoch: 834/1500\n",
            "fps step: 9843 fps step and policy inference: 7942 fps total: 6738 epoch: 835/1500\n",
            "fps step: 9125 fps step and policy inference: 7136 fps total: 6146 epoch: 836/1500\n",
            "fps step: 9485 fps step and policy inference: 7584 fps total: 6480 epoch: 837/1500\n",
            "fps step: 9824 fps step and policy inference: 7720 fps total: 6582 epoch: 838/1500\n",
            "fps step: 8264 fps step and policy inference: 6549 fps total: 5690 epoch: 839/1500\n",
            "fps step: 9821 fps step and policy inference: 7873 fps total: 6695 epoch: 840/1500\n",
            "fps step: 9147 fps step and policy inference: 7230 fps total: 6217 epoch: 841/1500\n",
            "fps step: 9356 fps step and policy inference: 7540 fps total: 6443 epoch: 842/1500\n",
            "fps step: 9245 fps step and policy inference: 7482 fps total: 6409 epoch: 843/1500\n",
            "fps step: 9343 fps step and policy inference: 7351 fps total: 6306 epoch: 844/1500\n",
            "fps step: 9690 fps step and policy inference: 7770 fps total: 6613 epoch: 845/1500\n",
            "fps step: 9599 fps step and policy inference: 7615 fps total: 6500 epoch: 846/1500\n",
            "saving next best rewards:  [92.32931]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9040 fps step and policy inference: 7117 fps total: 6133 epoch: 847/1500\n",
            "fps step: 10428 fps step and policy inference: 8168 fps total: 6900 epoch: 848/1500\n",
            "saving next best rewards:  [96.85858]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9525 fps step and policy inference: 7410 fps total: 6330 epoch: 849/1500\n",
            "fps step: 10140 fps step and policy inference: 8028 fps total: 6802 epoch: 850/1500\n",
            "fps step: 8785 fps step and policy inference: 6964 fps total: 6006 epoch: 851/1500\n",
            "fps step: 10268 fps step and policy inference: 8158 fps total: 6891 epoch: 852/1500\n",
            "fps step: 7966 fps step and policy inference: 6383 fps total: 5581 epoch: 853/1500\n",
            "fps step: 9682 fps step and policy inference: 7660 fps total: 6532 epoch: 854/1500\n",
            "fps step: 9539 fps step and policy inference: 7637 fps total: 6521 epoch: 855/1500\n",
            "fps step: 9770 fps step and policy inference: 7735 fps total: 6573 epoch: 856/1500\n",
            "fps step: 7558 fps step and policy inference: 5979 fps total: 5255 epoch: 857/1500\n",
            "fps step: 9180 fps step and policy inference: 7130 fps total: 6139 epoch: 858/1500\n",
            "fps step: 8710 fps step and policy inference: 6892 fps total: 5966 epoch: 859/1500\n",
            "fps step: 9261 fps step and policy inference: 7327 fps total: 6291 epoch: 860/1500\n",
            "fps step: 8945 fps step and policy inference: 7063 fps total: 6186 epoch: 861/1500\n",
            "fps step: 8849 fps step and policy inference: 7054 fps total: 6095 epoch: 862/1500\n",
            "fps step: 8244 fps step and policy inference: 6527 fps total: 5690 epoch: 863/1500\n",
            "fps step: 9803 fps step and policy inference: 7748 fps total: 6597 epoch: 864/1500\n",
            "fps step: 9114 fps step and policy inference: 7175 fps total: 6181 epoch: 865/1500\n",
            "fps step: 9222 fps step and policy inference: 7252 fps total: 6239 epoch: 866/1500\n",
            "fps step: 9755 fps step and policy inference: 7835 fps total: 6666 epoch: 867/1500\n",
            "fps step: 9744 fps step and policy inference: 7722 fps total: 6578 epoch: 868/1500\n",
            "fps step: 9270 fps step and policy inference: 7383 fps total: 6331 epoch: 869/1500\n",
            "fps step: 9701 fps step and policy inference: 7696 fps total: 6565 epoch: 870/1500\n",
            "fps step: 7485 fps step and policy inference: 5791 fps total: 5122 epoch: 871/1500\n",
            "fps step: 10483 fps step and policy inference: 8300 fps total: 6995 epoch: 872/1500\n",
            "fps step: 10593 fps step and policy inference: 8432 fps total: 7086 epoch: 873/1500\n",
            "saving next best rewards:  [101.07825]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 8644 fps step and policy inference: 6819 fps total: 5911 epoch: 874/1500\n",
            "fps step: 8294 fps step and policy inference: 6554 fps total: 5712 epoch: 875/1500\n",
            "fps step: 9520 fps step and policy inference: 7534 fps total: 6426 epoch: 876/1500\n",
            "fps step: 9624 fps step and policy inference: 7546 fps total: 6451 epoch: 877/1500\n",
            "fps step: 9013 fps step and policy inference: 7285 fps total: 6259 epoch: 878/1500\n",
            "fps step: 9348 fps step and policy inference: 7484 fps total: 6406 epoch: 879/1500\n",
            "fps step: 9050 fps step and policy inference: 7109 fps total: 6127 epoch: 880/1500\n",
            "fps step: 9486 fps step and policy inference: 7464 fps total: 6389 epoch: 881/1500\n",
            "fps step: 10292 fps step and policy inference: 8244 fps total: 6925 epoch: 882/1500\n",
            "fps step: 9398 fps step and policy inference: 7362 fps total: 6309 epoch: 883/1500\n",
            "fps step: 10215 fps step and policy inference: 8053 fps total: 6811 epoch: 884/1500\n",
            "fps step: 9257 fps step and policy inference: 7368 fps total: 6306 epoch: 885/1500\n",
            "fps step: 10071 fps step and policy inference: 8015 fps total: 6790 epoch: 886/1500\n",
            "fps step: 9119 fps step and policy inference: 7062 fps total: 6089 epoch: 887/1500\n",
            "fps step: 9032 fps step and policy inference: 7198 fps total: 6189 epoch: 888/1500\n",
            "fps step: 10041 fps step and policy inference: 7934 fps total: 6731 epoch: 889/1500\n",
            "fps step: 9776 fps step and policy inference: 7787 fps total: 6626 epoch: 890/1500\n",
            "fps step: 10257 fps step and policy inference: 7971 fps total: 6753 epoch: 891/1500\n",
            "fps step: 8461 fps step and policy inference: 6564 fps total: 5721 epoch: 892/1500\n",
            "fps step: 8563 fps step and policy inference: 6786 fps total: 5893 epoch: 893/1500\n",
            "fps step: 8815 fps step and policy inference: 6925 fps total: 5990 epoch: 894/1500\n",
            "fps step: 9248 fps step and policy inference: 7372 fps total: 6330 epoch: 895/1500\n",
            "fps step: 8965 fps step and policy inference: 7017 fps total: 6057 epoch: 896/1500\n",
            "fps step: 8797 fps step and policy inference: 7023 fps total: 6061 epoch: 897/1500\n",
            "fps step: 10096 fps step and policy inference: 8115 fps total: 6855 epoch: 898/1500\n",
            "fps step: 10843 fps step and policy inference: 8608 fps total: 7216 epoch: 899/1500\n",
            "fps step: 10188 fps step and policy inference: 8073 fps total: 6831 epoch: 900/1500\n",
            "fps step: 9566 fps step and policy inference: 7698 fps total: 6562 epoch: 901/1500\n",
            "fps step: 8999 fps step and policy inference: 7183 fps total: 6182 epoch: 902/1500\n",
            "fps step: 10054 fps step and policy inference: 8041 fps total: 6810 epoch: 903/1500\n",
            "fps step: 9802 fps step and policy inference: 7876 fps total: 6690 epoch: 904/1500\n",
            "fps step: 8499 fps step and policy inference: 6831 fps total: 5912 epoch: 905/1500\n",
            "fps step: 9708 fps step and policy inference: 7842 fps total: 6665 epoch: 906/1500\n",
            "fps step: 9387 fps step and policy inference: 7518 fps total: 6429 epoch: 907/1500\n",
            "fps step: 9024 fps step and policy inference: 7246 fps total: 6227 epoch: 908/1500\n",
            "fps step: 9514 fps step and policy inference: 7507 fps total: 6422 epoch: 909/1500\n",
            "fps step: 10242 fps step and policy inference: 8106 fps total: 6856 epoch: 910/1500\n",
            "fps step: 10285 fps step and policy inference: 8059 fps total: 6810 epoch: 911/1500\n",
            "fps step: 10707 fps step and policy inference: 8484 fps total: 7124 epoch: 912/1500\n",
            "fps step: 10104 fps step and policy inference: 8038 fps total: 6780 epoch: 913/1500\n",
            "fps step: 9756 fps step and policy inference: 7647 fps total: 6522 epoch: 914/1500\n",
            "fps step: 9865 fps step and policy inference: 7898 fps total: 6705 epoch: 915/1500\n",
            "fps step: 9077 fps step and policy inference: 7351 fps total: 6287 epoch: 916/1500\n",
            "fps step: 9931 fps step and policy inference: 7976 fps total: 6761 epoch: 917/1500\n",
            "fps step: 9133 fps step and policy inference: 7362 fps total: 6314 epoch: 918/1500\n",
            "fps step: 9070 fps step and policy inference: 7203 fps total: 6199 epoch: 919/1500\n",
            "fps step: 9607 fps step and policy inference: 7683 fps total: 6551 epoch: 920/1500\n",
            "fps step: 9215 fps step and policy inference: 7435 fps total: 6370 epoch: 921/1500\n",
            "fps step: 9505 fps step and policy inference: 7517 fps total: 6415 epoch: 922/1500\n",
            "fps step: 10072 fps step and policy inference: 8069 fps total: 6829 epoch: 923/1500\n",
            "fps step: 8055 fps step and policy inference: 6261 fps total: 5488 epoch: 924/1500\n",
            "fps step: 8263 fps step and policy inference: 6617 fps total: 5758 epoch: 925/1500\n",
            "fps step: 10141 fps step and policy inference: 8004 fps total: 6789 epoch: 926/1500\n",
            "fps step: 10038 fps step and policy inference: 7938 fps total: 6738 epoch: 927/1500\n",
            "fps step: 9555 fps step and policy inference: 7478 fps total: 6404 epoch: 928/1500\n",
            "fps step: 10842 fps step and policy inference: 8559 fps total: 7182 epoch: 929/1500\n",
            "fps step: 10298 fps step and policy inference: 8167 fps total: 6908 epoch: 930/1500\n",
            "fps step: 8552 fps step and policy inference: 6920 fps total: 5972 epoch: 931/1500\n",
            "fps step: 8706 fps step and policy inference: 6918 fps total: 5970 epoch: 932/1500\n",
            "fps step: 8625 fps step and policy inference: 6840 fps total: 5928 epoch: 933/1500\n",
            "fps step: 10042 fps step and policy inference: 8014 fps total: 6772 epoch: 934/1500\n",
            "fps step: 9812 fps step and policy inference: 7802 fps total: 6637 epoch: 935/1500\n",
            "fps step: 9014 fps step and policy inference: 7237 fps total: 6222 epoch: 936/1500\n",
            "fps step: 9379 fps step and policy inference: 7331 fps total: 6284 epoch: 937/1500\n",
            "fps step: 9678 fps step and policy inference: 7625 fps total: 6505 epoch: 938/1500\n",
            "fps step: 7909 fps step and policy inference: 6158 fps total: 5406 epoch: 939/1500\n",
            "fps step: 9877 fps step and policy inference: 7944 fps total: 6740 epoch: 940/1500\n",
            "fps step: 9934 fps step and policy inference: 7886 fps total: 6699 epoch: 941/1500\n",
            "fps step: 9035 fps step and policy inference: 7102 fps total: 6123 epoch: 942/1500\n",
            "fps step: 8898 fps step and policy inference: 7042 fps total: 6083 epoch: 943/1500\n",
            "fps step: 7877 fps step and policy inference: 6158 fps total: 5391 epoch: 944/1500\n",
            "fps step: 9885 fps step and policy inference: 7782 fps total: 6615 epoch: 945/1500\n",
            "fps step: 9805 fps step and policy inference: 7838 fps total: 6663 epoch: 946/1500\n",
            "fps step: 8823 fps step and policy inference: 7164 fps total: 6170 epoch: 947/1500\n",
            "fps step: 9433 fps step and policy inference: 7599 fps total: 6490 epoch: 948/1500\n",
            "fps step: 10049 fps step and policy inference: 8092 fps total: 6825 epoch: 949/1500\n",
            "fps step: 9699 fps step and policy inference: 7857 fps total: 6677 epoch: 950/1500\n",
            "fps step: 9953 fps step and policy inference: 8006 fps total: 6786 epoch: 951/1500\n",
            "fps step: 10328 fps step and policy inference: 8232 fps total: 6946 epoch: 952/1500\n",
            "fps step: 8166 fps step and policy inference: 6319 fps total: 5535 epoch: 953/1500\n",
            "fps step: 10453 fps step and policy inference: 8178 fps total: 6907 epoch: 954/1500\n",
            "fps step: 8423 fps step and policy inference: 6543 fps total: 5702 epoch: 955/1500\n",
            "fps step: 11318 fps step and policy inference: 8963 fps total: 7431 epoch: 956/1500\n",
            "fps step: 10183 fps step and policy inference: 8084 fps total: 6840 epoch: 957/1500\n",
            "fps step: 9741 fps step and policy inference: 7682 fps total: 6549 epoch: 958/1500\n",
            "fps step: 9367 fps step and policy inference: 7414 fps total: 6355 epoch: 959/1500\n",
            "fps step: 10213 fps step and policy inference: 8037 fps total: 6821 epoch: 960/1500\n",
            "fps step: 8700 fps step and policy inference: 6904 fps total: 5975 epoch: 961/1500\n",
            "fps step: 8828 fps step and policy inference: 7026 fps total: 6067 epoch: 962/1500\n",
            "fps step: 9819 fps step and policy inference: 7733 fps total: 6588 epoch: 963/1500\n",
            "fps step: 8202 fps step and policy inference: 6565 fps total: 5712 epoch: 964/1500\n",
            "fps step: 10033 fps step and policy inference: 7960 fps total: 6751 epoch: 965/1500\n",
            "fps step: 9019 fps step and policy inference: 7121 fps total: 6114 epoch: 966/1500\n",
            "fps step: 9847 fps step and policy inference: 7719 fps total: 6581 epoch: 967/1500\n",
            "fps step: 9029 fps step and policy inference: 7098 fps total: 6123 epoch: 968/1500\n",
            "fps step: 10433 fps step and policy inference: 8331 fps total: 6997 epoch: 969/1500\n",
            "fps step: 10988 fps step and policy inference: 8765 fps total: 7332 epoch: 970/1500\n",
            "fps step: 9145 fps step and policy inference: 7246 fps total: 6229 epoch: 971/1500\n",
            "fps step: 8249 fps step and policy inference: 6519 fps total: 5685 epoch: 972/1500\n",
            "fps step: 10215 fps step and policy inference: 8270 fps total: 6972 epoch: 973/1500\n",
            "fps step: 9487 fps step and policy inference: 7594 fps total: 6488 epoch: 974/1500\n",
            "fps step: 10533 fps step and policy inference: 8375 fps total: 7050 epoch: 975/1500\n",
            "fps step: 8098 fps step and policy inference: 6294 fps total: 5501 epoch: 976/1500\n",
            "fps step: 9675 fps step and policy inference: 7545 fps total: 6450 epoch: 977/1500\n",
            "fps step: 8963 fps step and policy inference: 7049 fps total: 6091 epoch: 978/1500\n",
            "fps step: 8936 fps step and policy inference: 7098 fps total: 6120 epoch: 979/1500\n",
            "fps step: 8474 fps step and policy inference: 6664 fps total: 5793 epoch: 980/1500\n",
            "fps step: 9071 fps step and policy inference: 7284 fps total: 6264 epoch: 981/1500\n",
            "fps step: 9019 fps step and policy inference: 7261 fps total: 6252 epoch: 982/1500\n",
            "fps step: 9980 fps step and policy inference: 7874 fps total: 6697 epoch: 983/1500\n",
            "fps step: 9121 fps step and policy inference: 7328 fps total: 6281 epoch: 984/1500\n",
            "fps step: 9425 fps step and policy inference: 7570 fps total: 6468 epoch: 985/1500\n",
            "fps step: 8075 fps step and policy inference: 6473 fps total: 5665 epoch: 986/1500\n",
            "fps step: 9762 fps step and policy inference: 7699 fps total: 6567 epoch: 987/1500\n",
            "fps step: 9216 fps step and policy inference: 7317 fps total: 6283 epoch: 988/1500\n",
            "fps step: 9073 fps step and policy inference: 7230 fps total: 6219 epoch: 989/1500\n",
            "fps step: 9756 fps step and policy inference: 7871 fps total: 6692 epoch: 990/1500\n",
            "fps step: 9747 fps step and policy inference: 7809 fps total: 6641 epoch: 991/1500\n",
            "fps step: 9417 fps step and policy inference: 7412 fps total: 6351 epoch: 992/1500\n",
            "fps step: 9522 fps step and policy inference: 7591 fps total: 6483 epoch: 993/1500\n",
            "fps step: 9473 fps step and policy inference: 7515 fps total: 6428 epoch: 994/1500\n",
            "fps step: 8745 fps step and policy inference: 6999 fps total: 6047 epoch: 995/1500\n",
            "fps step: 9284 fps step and policy inference: 7335 fps total: 6295 epoch: 996/1500\n",
            "fps step: 8394 fps step and policy inference: 6773 fps total: 5877 epoch: 997/1500\n",
            "fps step: 9941 fps step and policy inference: 7850 fps total: 6671 epoch: 998/1500\n",
            "fps step: 9118 fps step and policy inference: 7181 fps total: 6175 epoch: 999/1500\n",
            "fps step: 8240 fps step and policy inference: 6403 fps total: 5596 epoch: 1000/1500\n",
            "fps step: 9220 fps step and policy inference: 7364 fps total: 6316 epoch: 1001/1500\n",
            "fps step: 8445 fps step and policy inference: 6700 fps total: 5821 epoch: 1002/1500\n",
            "fps step: 10028 fps step and policy inference: 8024 fps total: 6798 epoch: 1003/1500\n",
            "fps step: 10727 fps step and policy inference: 8547 fps total: 7170 epoch: 1004/1500\n",
            "fps step: 9700 fps step and policy inference: 7669 fps total: 6553 epoch: 1005/1500\n",
            "fps step: 10638 fps step and policy inference: 8385 fps total: 7056 epoch: 1006/1500\n",
            "fps step: 8802 fps step and policy inference: 6898 fps total: 5971 epoch: 1007/1500\n",
            "fps step: 9496 fps step and policy inference: 7525 fps total: 6415 epoch: 1008/1500\n",
            "fps step: 8451 fps step and policy inference: 6737 fps total: 5848 epoch: 1009/1500\n",
            "fps step: 9066 fps step and policy inference: 7113 fps total: 6128 epoch: 1010/1500\n",
            "fps step: 9753 fps step and policy inference: 7883 fps total: 6697 epoch: 1011/1500\n",
            "fps step: 9123 fps step and policy inference: 7288 fps total: 6274 epoch: 1012/1500\n",
            "fps step: 11238 fps step and policy inference: 8968 fps total: 7467 epoch: 1013/1500\n",
            "fps step: 9110 fps step and policy inference: 7259 fps total: 6239 epoch: 1014/1500\n",
            "fps step: 8492 fps step and policy inference: 6625 fps total: 5765 epoch: 1015/1500\n",
            "fps step: 8746 fps step and policy inference: 6896 fps total: 5970 epoch: 1016/1500\n",
            "fps step: 8600 fps step and policy inference: 6828 fps total: 5919 epoch: 1017/1500\n",
            "fps step: 10808 fps step and policy inference: 8601 fps total: 7207 epoch: 1018/1500\n",
            "fps step: 10093 fps step and policy inference: 8067 fps total: 6824 epoch: 1019/1500\n",
            "fps step: 9430 fps step and policy inference: 7291 fps total: 6249 epoch: 1020/1500\n",
            "fps step: 10026 fps step and policy inference: 8042 fps total: 6792 epoch: 1021/1500\n",
            "fps step: 9349 fps step and policy inference: 7402 fps total: 6337 epoch: 1022/1500\n",
            "fps step: 9301 fps step and policy inference: 7429 fps total: 6366 epoch: 1023/1500\n",
            "fps step: 9404 fps step and policy inference: 7528 fps total: 6423 epoch: 1024/1500\n",
            "fps step: 7306 fps step and policy inference: 5668 fps total: 5005 epoch: 1025/1500\n",
            "fps step: 9759 fps step and policy inference: 7774 fps total: 6615 epoch: 1026/1500\n",
            "fps step: 9875 fps step and policy inference: 7860 fps total: 6678 epoch: 1027/1500\n",
            "fps step: 10001 fps step and policy inference: 7899 fps total: 6707 epoch: 1028/1500\n",
            "fps step: 10889 fps step and policy inference: 8710 fps total: 7280 epoch: 1029/1500\n",
            "fps step: 8350 fps step and policy inference: 6569 fps total: 5722 epoch: 1030/1500\n",
            "fps step: 9934 fps step and policy inference: 7901 fps total: 6710 epoch: 1031/1500\n",
            "fps step: 9766 fps step and policy inference: 7741 fps total: 6590 epoch: 1032/1500\n",
            "fps step: 10456 fps step and policy inference: 8309 fps total: 7006 epoch: 1033/1500\n",
            "fps step: 9466 fps step and policy inference: 7523 fps total: 6435 epoch: 1034/1500\n",
            "fps step: 8450 fps step and policy inference: 6558 fps total: 5719 epoch: 1035/1500\n",
            "fps step: 7865 fps step and policy inference: 6089 fps total: 5344 epoch: 1036/1500\n",
            "fps step: 8444 fps step and policy inference: 6562 fps total: 5717 epoch: 1037/1500\n",
            "fps step: 9160 fps step and policy inference: 7293 fps total: 6259 epoch: 1038/1500\n",
            "fps step: 9432 fps step and policy inference: 7634 fps total: 6516 epoch: 1039/1500\n",
            "fps step: 8415 fps step and policy inference: 6616 fps total: 5759 epoch: 1040/1500\n",
            "fps step: 10146 fps step and policy inference: 8013 fps total: 6786 epoch: 1041/1500\n",
            "fps step: 8802 fps step and policy inference: 6999 fps total: 6045 epoch: 1042/1500\n",
            "fps step: 9774 fps step and policy inference: 7858 fps total: 6677 epoch: 1043/1500\n",
            "fps step: 8740 fps step and policy inference: 6930 fps total: 5977 epoch: 1044/1500\n",
            "fps step: 9684 fps step and policy inference: 7749 fps total: 6588 epoch: 1045/1500\n",
            "fps step: 10577 fps step and policy inference: 8426 fps total: 7086 epoch: 1046/1500\n",
            "fps step: 9670 fps step and policy inference: 7694 fps total: 6567 epoch: 1047/1500\n",
            "fps step: 9299 fps step and policy inference: 7328 fps total: 6292 epoch: 1048/1500\n",
            "fps step: 9745 fps step and policy inference: 7751 fps total: 6613 epoch: 1049/1500\n",
            "fps step: 9829 fps step and policy inference: 7862 fps total: 6681 epoch: 1050/1500\n",
            "fps step: 8988 fps step and policy inference: 7158 fps total: 6165 epoch: 1051/1500\n",
            "fps step: 9287 fps step and policy inference: 7542 fps total: 6450 epoch: 1052/1500\n",
            "fps step: 9752 fps step and policy inference: 7717 fps total: 6575 epoch: 1053/1500\n",
            "fps step: 8910 fps step and policy inference: 7022 fps total: 6067 epoch: 1054/1500\n",
            "fps step: 9644 fps step and policy inference: 7652 fps total: 6528 epoch: 1055/1500\n",
            "fps step: 7902 fps step and policy inference: 6127 fps total: 5378 epoch: 1056/1500\n",
            "fps step: 8427 fps step and policy inference: 6660 fps total: 5794 epoch: 1057/1500\n",
            "fps step: 9033 fps step and policy inference: 7037 fps total: 6078 epoch: 1058/1500\n",
            "fps step: 8166 fps step and policy inference: 6538 fps total: 5699 epoch: 1059/1500\n",
            "fps step: 8988 fps step and policy inference: 7125 fps total: 6169 epoch: 1060/1500\n",
            "fps step: 9661 fps step and policy inference: 7606 fps total: 6497 epoch: 1061/1500\n",
            "fps step: 9127 fps step and policy inference: 7290 fps total: 6264 epoch: 1062/1500\n",
            "fps step: 9101 fps step and policy inference: 7279 fps total: 6256 epoch: 1063/1500\n",
            "fps step: 9328 fps step and policy inference: 7423 fps total: 6359 epoch: 1064/1500\n",
            "fps step: 8834 fps step and policy inference: 7100 fps total: 6109 epoch: 1065/1500\n",
            "fps step: 9155 fps step and policy inference: 7387 fps total: 6326 epoch: 1066/1500\n",
            "fps step: 8719 fps step and policy inference: 6861 fps total: 5944 epoch: 1067/1500\n",
            "fps step: 8105 fps step and policy inference: 6354 fps total: 5552 epoch: 1068/1500\n",
            "fps step: 9923 fps step and policy inference: 7889 fps total: 6705 epoch: 1069/1500\n",
            "fps step: 9010 fps step and policy inference: 7211 fps total: 6208 epoch: 1070/1500\n",
            "fps step: 9794 fps step and policy inference: 7917 fps total: 6720 epoch: 1071/1500\n",
            "fps step: 10636 fps step and policy inference: 8517 fps total: 7156 epoch: 1072/1500\n",
            "fps step: 8619 fps step and policy inference: 6764 fps total: 5881 epoch: 1073/1500\n",
            "fps step: 9892 fps step and policy inference: 7854 fps total: 6680 epoch: 1074/1500\n",
            "fps step: 9293 fps step and policy inference: 7284 fps total: 6259 epoch: 1075/1500\n",
            "fps step: 9691 fps step and policy inference: 7739 fps total: 6584 epoch: 1076/1500\n",
            "fps step: 9912 fps step and policy inference: 8008 fps total: 6788 epoch: 1077/1500\n",
            "fps step: 7492 fps step and policy inference: 5791 fps total: 5109 epoch: 1078/1500\n",
            "fps step: 8100 fps step and policy inference: 6296 fps total: 5512 epoch: 1079/1500\n",
            "fps step: 8995 fps step and policy inference: 7114 fps total: 6137 epoch: 1080/1500\n",
            "fps step: 10544 fps step and policy inference: 8386 fps total: 7055 epoch: 1081/1500\n",
            "fps step: 8536 fps step and policy inference: 6708 fps total: 5827 epoch: 1082/1500\n",
            "fps step: 8188 fps step and policy inference: 6550 fps total: 5709 epoch: 1083/1500\n",
            "fps step: 9272 fps step and policy inference: 7309 fps total: 6276 epoch: 1084/1500\n",
            "fps step: 9214 fps step and policy inference: 7296 fps total: 6268 epoch: 1085/1500\n",
            "fps step: 9995 fps step and policy inference: 7926 fps total: 6727 epoch: 1086/1500\n",
            "fps step: 10844 fps step and policy inference: 8466 fps total: 7092 epoch: 1087/1500\n",
            "fps step: 9938 fps step and policy inference: 8003 fps total: 6783 epoch: 1088/1500\n",
            "fps step: 11759 fps step and policy inference: 9282 fps total: 7655 epoch: 1089/1500\n",
            "fps step: 9423 fps step and policy inference: 7496 fps total: 6414 epoch: 1090/1500\n",
            "fps step: 10311 fps step and policy inference: 8157 fps total: 6882 epoch: 1091/1500\n",
            "fps step: 9018 fps step and policy inference: 7090 fps total: 6096 epoch: 1092/1500\n",
            "fps step: 9981 fps step and policy inference: 7848 fps total: 6648 epoch: 1093/1500\n",
            "fps step: 8629 fps step and policy inference: 6911 fps total: 5981 epoch: 1094/1500\n",
            "fps step: 8846 fps step and policy inference: 6967 fps total: 6007 epoch: 1095/1500\n",
            "fps step: 9849 fps step and policy inference: 7892 fps total: 6700 epoch: 1096/1500\n",
            "fps step: 10481 fps step and policy inference: 8231 fps total: 6933 epoch: 1097/1500\n",
            "fps step: 9500 fps step and policy inference: 7501 fps total: 6405 epoch: 1098/1500\n",
            "fps step: 10424 fps step and policy inference: 8167 fps total: 6898 epoch: 1099/1500\n",
            "fps step: 9344 fps step and policy inference: 7286 fps total: 6256 epoch: 1100/1500\n",
            "fps step: 9392 fps step and policy inference: 7421 fps total: 6358 epoch: 1101/1500\n",
            "fps step: 10718 fps step and policy inference: 8528 fps total: 7154 epoch: 1102/1500\n",
            "fps step: 10682 fps step and policy inference: 8449 fps total: 7099 epoch: 1103/1500\n",
            "fps step: 8923 fps step and policy inference: 7166 fps total: 6171 epoch: 1104/1500\n",
            "fps step: 9530 fps step and policy inference: 7535 fps total: 6440 epoch: 1105/1500\n",
            "fps step: 9470 fps step and policy inference: 7365 fps total: 6319 epoch: 1106/1500\n",
            "fps step: 9862 fps step and policy inference: 7733 fps total: 6592 epoch: 1107/1500\n",
            "fps step: 9508 fps step and policy inference: 7614 fps total: 6501 epoch: 1108/1500\n",
            "fps step: 8628 fps step and policy inference: 6734 fps total: 5832 epoch: 1109/1500\n",
            "fps step: 8824 fps step and policy inference: 6941 fps total: 6004 epoch: 1110/1500\n",
            "fps step: 10549 fps step and policy inference: 8326 fps total: 7011 epoch: 1111/1500\n",
            "fps step: 9433 fps step and policy inference: 7470 fps total: 6394 epoch: 1112/1500\n",
            "fps step: 9173 fps step and policy inference: 7287 fps total: 6260 epoch: 1113/1500\n",
            "fps step: 9092 fps step and policy inference: 7183 fps total: 6186 epoch: 1114/1500\n",
            "fps step: 9998 fps step and policy inference: 7971 fps total: 6745 epoch: 1115/1500\n",
            "fps step: 8626 fps step and policy inference: 6792 fps total: 5892 epoch: 1116/1500\n",
            "fps step: 9748 fps step and policy inference: 7804 fps total: 6638 epoch: 1117/1500\n",
            "fps step: 9526 fps step and policy inference: 7679 fps total: 6543 epoch: 1118/1500\n",
            "fps step: 9962 fps step and policy inference: 7803 fps total: 6633 epoch: 1119/1500\n",
            "fps step: 8332 fps step and policy inference: 6610 fps total: 5754 epoch: 1120/1500\n",
            "fps step: 9952 fps step and policy inference: 7939 fps total: 6737 epoch: 1121/1500\n",
            "fps step: 9887 fps step and policy inference: 7828 fps total: 6637 epoch: 1122/1500\n",
            "fps step: 10545 fps step and policy inference: 8403 fps total: 7065 epoch: 1123/1500\n",
            "fps step: 10271 fps step and policy inference: 8141 fps total: 6880 epoch: 1124/1500\n",
            "fps step: 9991 fps step and policy inference: 7902 fps total: 6709 epoch: 1125/1500\n",
            "fps step: 9694 fps step and policy inference: 7688 fps total: 6557 epoch: 1126/1500\n",
            "fps step: 10449 fps step and policy inference: 8386 fps total: 7029 epoch: 1127/1500\n",
            "fps step: 8071 fps step and policy inference: 6315 fps total: 5533 epoch: 1128/1500\n",
            "fps step: 10305 fps step and policy inference: 8238 fps total: 6961 epoch: 1129/1500\n",
            "fps step: 8148 fps step and policy inference: 6573 fps total: 5727 epoch: 1130/1500\n",
            "fps step: 8489 fps step and policy inference: 6714 fps total: 5833 epoch: 1131/1500\n",
            "fps step: 8743 fps step and policy inference: 6886 fps total: 5966 epoch: 1132/1500\n",
            "fps step: 9259 fps step and policy inference: 7467 fps total: 6378 epoch: 1133/1500\n",
            "fps step: 8982 fps step and policy inference: 7070 fps total: 6100 epoch: 1134/1500\n",
            "fps step: 9705 fps step and policy inference: 7748 fps total: 6597 epoch: 1135/1500\n",
            "fps step: 9863 fps step and policy inference: 7809 fps total: 6639 epoch: 1136/1500\n",
            "fps step: 9206 fps step and policy inference: 7251 fps total: 6234 epoch: 1137/1500\n",
            "fps step: 10368 fps step and policy inference: 8197 fps total: 6902 epoch: 1138/1500\n",
            "fps step: 9180 fps step and policy inference: 7280 fps total: 6255 epoch: 1139/1500\n",
            "fps step: 10895 fps step and policy inference: 8589 fps total: 7198 epoch: 1140/1500\n",
            "fps step: 10178 fps step and policy inference: 8200 fps total: 6923 epoch: 1141/1500\n",
            "fps step: 9619 fps step and policy inference: 7523 fps total: 6429 epoch: 1142/1500\n",
            "fps step: 9375 fps step and policy inference: 7534 fps total: 6447 epoch: 1143/1500\n",
            "fps step: 9679 fps step and policy inference: 7646 fps total: 6525 epoch: 1144/1500\n",
            "fps step: 9947 fps step and policy inference: 7802 fps total: 6613 epoch: 1145/1500\n",
            "fps step: 9830 fps step and policy inference: 7795 fps total: 6628 epoch: 1146/1500\n",
            "fps step: 10580 fps step and policy inference: 8479 fps total: 7123 epoch: 1147/1500\n",
            "fps step: 9410 fps step and policy inference: 7468 fps total: 6393 epoch: 1148/1500\n",
            "fps step: 10484 fps step and policy inference: 8268 fps total: 6977 epoch: 1149/1500\n",
            "fps step: 9019 fps step and policy inference: 7092 fps total: 6118 epoch: 1150/1500\n",
            "fps step: 9211 fps step and policy inference: 7352 fps total: 6309 epoch: 1151/1500\n",
            "fps step: 9474 fps step and policy inference: 7531 fps total: 6439 epoch: 1152/1500\n",
            "fps step: 10325 fps step and policy inference: 8127 fps total: 6868 epoch: 1153/1500\n",
            "fps step: 8768 fps step and policy inference: 6854 fps total: 5937 epoch: 1154/1500\n",
            "fps step: 8404 fps step and policy inference: 6649 fps total: 5782 epoch: 1155/1500\n",
            "fps step: 9767 fps step and policy inference: 7744 fps total: 6595 epoch: 1156/1500\n",
            "fps step: 10587 fps step and policy inference: 8366 fps total: 7040 epoch: 1157/1500\n",
            "fps step: 10413 fps step and policy inference: 8187 fps total: 6914 epoch: 1158/1500\n",
            "fps step: 11282 fps step and policy inference: 8964 fps total: 7467 epoch: 1159/1500\n",
            "fps step: 8518 fps step and policy inference: 6694 fps total: 5817 epoch: 1160/1500\n",
            "fps step: 9901 fps step and policy inference: 7828 fps total: 6656 epoch: 1161/1500\n",
            "fps step: 8234 fps step and policy inference: 6544 fps total: 5705 epoch: 1162/1500\n",
            "fps step: 10351 fps step and policy inference: 8171 fps total: 6900 epoch: 1163/1500\n",
            "fps step: 10338 fps step and policy inference: 8258 fps total: 6978 epoch: 1164/1500\n",
            "fps step: 8144 fps step and policy inference: 6288 fps total: 5513 epoch: 1165/1500\n",
            "fps step: 10132 fps step and policy inference: 7999 fps total: 6778 epoch: 1166/1500\n",
            "fps step: 10315 fps step and policy inference: 8164 fps total: 6896 epoch: 1167/1500\n",
            "fps step: 9280 fps step and policy inference: 7306 fps total: 6276 epoch: 1168/1500\n",
            "fps step: 10325 fps step and policy inference: 8107 fps total: 6855 epoch: 1169/1500\n",
            "fps step: 10758 fps step and policy inference: 8590 fps total: 7198 epoch: 1170/1500\n",
            "fps step: 9188 fps step and policy inference: 7329 fps total: 6299 epoch: 1171/1500\n",
            "fps step: 8970 fps step and policy inference: 7001 fps total: 6048 epoch: 1172/1500\n",
            "fps step: 8052 fps step and policy inference: 6273 fps total: 5499 epoch: 1173/1500\n",
            "fps step: 9240 fps step and policy inference: 7300 fps total: 6276 epoch: 1174/1500\n",
            "fps step: 9157 fps step and policy inference: 7277 fps total: 6253 epoch: 1175/1500\n",
            "fps step: 9627 fps step and policy inference: 7507 fps total: 6418 epoch: 1176/1500\n",
            "fps step: 9956 fps step and policy inference: 7960 fps total: 6750 epoch: 1177/1500\n",
            "fps step: 9337 fps step and policy inference: 7318 fps total: 6268 epoch: 1178/1500\n",
            "fps step: 9050 fps step and policy inference: 7138 fps total: 6150 epoch: 1179/1500\n",
            "fps step: 9857 fps step and policy inference: 7735 fps total: 6588 epoch: 1180/1500\n",
            "fps step: 9723 fps step and policy inference: 7618 fps total: 6501 epoch: 1181/1500\n",
            "fps step: 10551 fps step and policy inference: 8456 fps total: 7109 epoch: 1182/1500\n",
            "fps step: 9514 fps step and policy inference: 7500 fps total: 6416 epoch: 1183/1500\n",
            "fps step: 10049 fps step and policy inference: 7889 fps total: 6699 epoch: 1184/1500\n",
            "fps step: 9830 fps step and policy inference: 7770 fps total: 6615 epoch: 1185/1500\n",
            "fps step: 9892 fps step and policy inference: 7787 fps total: 6627 epoch: 1186/1500\n",
            "fps step: 10172 fps step and policy inference: 8083 fps total: 6837 epoch: 1187/1500\n",
            "fps step: 10344 fps step and policy inference: 8199 fps total: 6928 epoch: 1188/1500\n",
            "fps step: 10723 fps step and policy inference: 8482 fps total: 7122 epoch: 1189/1500\n",
            "fps step: 9931 fps step and policy inference: 7840 fps total: 6666 epoch: 1190/1500\n",
            "fps step: 9017 fps step and policy inference: 7116 fps total: 6136 epoch: 1191/1500\n",
            "fps step: 10255 fps step and policy inference: 8155 fps total: 6890 epoch: 1192/1500\n",
            "fps step: 10663 fps step and policy inference: 8495 fps total: 7131 epoch: 1193/1500\n",
            "fps step: 10276 fps step and policy inference: 8058 fps total: 6822 epoch: 1194/1500\n",
            "fps step: 9545 fps step and policy inference: 7647 fps total: 6524 epoch: 1195/1500\n",
            "fps step: 9716 fps step and policy inference: 7681 fps total: 6549 epoch: 1196/1500\n",
            "fps step: 10236 fps step and policy inference: 8152 fps total: 6889 epoch: 1197/1500\n",
            "fps step: 11097 fps step and policy inference: 8706 fps total: 7267 epoch: 1198/1500\n",
            "fps step: 8658 fps step and policy inference: 6794 fps total: 5900 epoch: 1199/1500\n",
            "fps step: 9650 fps step and policy inference: 7627 fps total: 6509 epoch: 1200/1500\n",
            "fps step: 9538 fps step and policy inference: 7499 fps total: 6417 epoch: 1201/1500\n",
            "fps step: 9938 fps step and policy inference: 7867 fps total: 6663 epoch: 1202/1500\n",
            "fps step: 8403 fps step and policy inference: 6552 fps total: 5709 epoch: 1203/1500\n",
            "fps step: 9594 fps step and policy inference: 7511 fps total: 6424 epoch: 1204/1500\n",
            "fps step: 11182 fps step and policy inference: 8965 fps total: 7433 epoch: 1205/1500\n",
            "fps step: 8698 fps step and policy inference: 6818 fps total: 5913 epoch: 1206/1500\n",
            "fps step: 9324 fps step and policy inference: 7379 fps total: 6327 epoch: 1207/1500\n",
            "fps step: 10032 fps step and policy inference: 8000 fps total: 6780 epoch: 1208/1500\n",
            "fps step: 8479 fps step and policy inference: 6712 fps total: 5830 epoch: 1209/1500\n",
            "fps step: 9089 fps step and policy inference: 7144 fps total: 6156 epoch: 1210/1500\n",
            "fps step: 10001 fps step and policy inference: 7930 fps total: 6726 epoch: 1211/1500\n",
            "fps step: 10264 fps step and policy inference: 8140 fps total: 6877 epoch: 1212/1500\n",
            "fps step: 10926 fps step and policy inference: 8697 fps total: 7268 epoch: 1213/1500\n",
            "fps step: 10678 fps step and policy inference: 8441 fps total: 7093 epoch: 1214/1500\n",
            "fps step: 9185 fps step and policy inference: 7210 fps total: 6194 epoch: 1215/1500\n",
            "fps step: 10087 fps step and policy inference: 8026 fps total: 6798 epoch: 1216/1500\n",
            "fps step: 10284 fps step and policy inference: 8145 fps total: 6884 epoch: 1217/1500\n",
            "fps step: 9313 fps step and policy inference: 7498 fps total: 6416 epoch: 1218/1500\n",
            "fps step: 9105 fps step and policy inference: 7278 fps total: 6253 epoch: 1219/1500\n",
            "fps step: 8425 fps step and policy inference: 6683 fps total: 5807 epoch: 1220/1500\n",
            "fps step: 9366 fps step and policy inference: 7508 fps total: 6423 epoch: 1221/1500\n",
            "fps step: 9086 fps step and policy inference: 7103 fps total: 6124 epoch: 1222/1500\n",
            "fps step: 10796 fps step and policy inference: 8577 fps total: 7188 epoch: 1223/1500\n",
            "fps step: 8987 fps step and policy inference: 7118 fps total: 6133 epoch: 1224/1500\n",
            "fps step: 8119 fps step and policy inference: 6392 fps total: 5590 epoch: 1225/1500\n",
            "fps step: 9350 fps step and policy inference: 7682 fps total: 6563 epoch: 1226/1500\n",
            "fps step: 8755 fps step and policy inference: 6927 fps total: 5993 epoch: 1227/1500\n",
            "fps step: 9787 fps step and policy inference: 7784 fps total: 6623 epoch: 1228/1500\n",
            "fps step: 10179 fps step and policy inference: 8122 fps total: 6824 epoch: 1229/1500\n",
            "fps step: 9720 fps step and policy inference: 7721 fps total: 6586 epoch: 1230/1500\n",
            "fps step: 8085 fps step and policy inference: 6405 fps total: 5597 epoch: 1231/1500\n",
            "fps step: 10510 fps step and policy inference: 8398 fps total: 7067 epoch: 1232/1500\n",
            "fps step: 9480 fps step and policy inference: 7497 fps total: 6417 epoch: 1233/1500\n",
            "fps step: 9539 fps step and policy inference: 7582 fps total: 6479 epoch: 1234/1500\n",
            "fps step: 10523 fps step and policy inference: 8322 fps total: 7020 epoch: 1235/1500\n",
            "fps step: 9164 fps step and policy inference: 7280 fps total: 6262 epoch: 1236/1500\n",
            "fps step: 8675 fps step and policy inference: 6890 fps total: 5965 epoch: 1237/1500\n",
            "fps step: 8750 fps step and policy inference: 7018 fps total: 6066 epoch: 1238/1500\n",
            "fps step: 10270 fps step and policy inference: 8023 fps total: 6797 epoch: 1239/1500\n",
            "fps step: 9178 fps step and policy inference: 7300 fps total: 6270 epoch: 1240/1500\n",
            "fps step: 8600 fps step and policy inference: 6895 fps total: 5970 epoch: 1241/1500\n",
            "fps step: 10562 fps step and policy inference: 8432 fps total: 7090 epoch: 1242/1500\n",
            "fps step: 8849 fps step and policy inference: 7055 fps total: 6046 epoch: 1243/1500\n",
            "fps step: 8779 fps step and policy inference: 6958 fps total: 6015 epoch: 1244/1500\n",
            "fps step: 9704 fps step and policy inference: 7822 fps total: 6648 epoch: 1245/1500\n",
            "fps step: 10002 fps step and policy inference: 7998 fps total: 6771 epoch: 1246/1500\n",
            "fps step: 8798 fps step and policy inference: 6978 fps total: 6030 epoch: 1247/1500\n",
            "fps step: 8994 fps step and policy inference: 7146 fps total: 6135 epoch: 1248/1500\n",
            "fps step: 9571 fps step and policy inference: 7626 fps total: 6485 epoch: 1249/1500\n",
            "fps step: 10156 fps step and policy inference: 8143 fps total: 6883 epoch: 1250/1500\n",
            "fps step: 8555 fps step and policy inference: 6740 fps total: 5844 epoch: 1251/1500\n",
            "fps step: 9082 fps step and policy inference: 7326 fps total: 6288 epoch: 1252/1500\n",
            "fps step: 8397 fps step and policy inference: 6657 fps total: 5794 epoch: 1253/1500\n",
            "fps step: 9842 fps step and policy inference: 7823 fps total: 6651 epoch: 1254/1500\n",
            "fps step: 9709 fps step and policy inference: 7780 fps total: 6629 epoch: 1255/1500\n",
            "fps step: 9124 fps step and policy inference: 7333 fps total: 6302 epoch: 1256/1500\n",
            "fps step: 7466 fps step and policy inference: 5815 fps total: 5141 epoch: 1257/1500\n",
            "fps step: 8198 fps step and policy inference: 6478 fps total: 5652 epoch: 1258/1500\n",
            "fps step: 10525 fps step and policy inference: 8434 fps total: 7092 epoch: 1259/1500\n",
            "fps step: 9044 fps step and policy inference: 7254 fps total: 6206 epoch: 1260/1500\n",
            "fps step: 11139 fps step and policy inference: 8824 fps total: 7373 epoch: 1261/1500\n",
            "fps step: 9884 fps step and policy inference: 7943 fps total: 6752 epoch: 1262/1500\n",
            "fps step: 7708 fps step and policy inference: 6117 fps total: 5378 epoch: 1263/1500\n",
            "fps step: 9372 fps step and policy inference: 7418 fps total: 6357 epoch: 1264/1500\n",
            "fps step: 9518 fps step and policy inference: 7559 fps total: 6461 epoch: 1265/1500\n",
            "fps step: 10243 fps step and policy inference: 8224 fps total: 6941 epoch: 1266/1500\n",
            "fps step: 9414 fps step and policy inference: 7463 fps total: 6386 epoch: 1267/1500\n",
            "fps step: 8728 fps step and policy inference: 6857 fps total: 5943 epoch: 1268/1500\n",
            "fps step: 8136 fps step and policy inference: 6370 fps total: 5572 epoch: 1269/1500\n",
            "fps step: 8398 fps step and policy inference: 6464 fps total: 5634 epoch: 1270/1500\n",
            "fps step: 11085 fps step and policy inference: 8830 fps total: 7367 epoch: 1271/1500\n",
            "fps step: 9697 fps step and policy inference: 7653 fps total: 6530 epoch: 1272/1500\n",
            "fps step: 8961 fps step and policy inference: 7009 fps total: 6056 epoch: 1273/1500\n",
            "fps step: 9288 fps step and policy inference: 7334 fps total: 6295 epoch: 1274/1500\n",
            "fps step: 9301 fps step and policy inference: 7294 fps total: 6267 epoch: 1275/1500\n",
            "fps step: 11132 fps step and policy inference: 8844 fps total: 7384 epoch: 1276/1500\n",
            "fps step: 9958 fps step and policy inference: 7975 fps total: 6766 epoch: 1277/1500\n",
            "fps step: 8294 fps step and policy inference: 6390 fps total: 5590 epoch: 1278/1500\n",
            "fps step: 9425 fps step and policy inference: 7400 fps total: 6352 epoch: 1279/1500\n",
            "fps step: 9297 fps step and policy inference: 7430 fps total: 6372 epoch: 1280/1500\n",
            "fps step: 9640 fps step and policy inference: 7595 fps total: 6485 epoch: 1281/1500\n",
            "fps step: 9960 fps step and policy inference: 7909 fps total: 6714 epoch: 1282/1500\n",
            "fps step: 10946 fps step and policy inference: 8703 fps total: 7265 epoch: 1283/1500\n",
            "fps step: 8842 fps step and policy inference: 7029 fps total: 6074 epoch: 1284/1500\n",
            "fps step: 10187 fps step and policy inference: 8084 fps total: 6846 epoch: 1285/1500\n",
            "fps step: 10204 fps step and policy inference: 8182 fps total: 6890 epoch: 1286/1500\n",
            "fps step: 9694 fps step and policy inference: 7752 fps total: 6602 epoch: 1287/1500\n",
            "fps step: 9911 fps step and policy inference: 7884 fps total: 6697 epoch: 1288/1500\n",
            "fps step: 9049 fps step and policy inference: 7234 fps total: 6222 epoch: 1289/1500\n",
            "fps step: 10098 fps step and policy inference: 8084 fps total: 6842 epoch: 1290/1500\n",
            "fps step: 9172 fps step and policy inference: 7296 fps total: 6264 epoch: 1291/1500\n",
            "fps step: 8809 fps step and policy inference: 7028 fps total: 6067 epoch: 1292/1500\n",
            "fps step: 10637 fps step and policy inference: 8314 fps total: 6982 epoch: 1293/1500\n",
            "fps step: 9074 fps step and policy inference: 7131 fps total: 6146 epoch: 1294/1500\n",
            "fps step: 10338 fps step and policy inference: 8125 fps total: 6842 epoch: 1295/1500\n",
            "fps step: 9558 fps step and policy inference: 7451 fps total: 6379 epoch: 1296/1500\n",
            "fps step: 10053 fps step and policy inference: 7902 fps total: 6712 epoch: 1297/1500\n",
            "fps step: 9171 fps step and policy inference: 7234 fps total: 6220 epoch: 1298/1500\n",
            "fps step: 9512 fps step and policy inference: 7611 fps total: 6498 epoch: 1299/1500\n",
            "fps step: 10103 fps step and policy inference: 8059 fps total: 6823 epoch: 1300/1500\n",
            "fps step: 8922 fps step and policy inference: 6992 fps total: 6040 epoch: 1301/1500\n",
            "fps step: 9920 fps step and policy inference: 7829 fps total: 6639 epoch: 1302/1500\n",
            "fps step: 8928 fps step and policy inference: 6942 fps total: 6005 epoch: 1303/1500\n",
            "fps step: 10702 fps step and policy inference: 8446 fps total: 7098 epoch: 1304/1500\n",
            "fps step: 11239 fps step and policy inference: 8833 fps total: 7369 epoch: 1305/1500\n",
            "fps step: 10395 fps step and policy inference: 8203 fps total: 6914 epoch: 1306/1500\n",
            "fps step: 8452 fps step and policy inference: 6684 fps total: 5810 epoch: 1307/1500\n",
            "fps step: 9915 fps step and policy inference: 7929 fps total: 6730 epoch: 1308/1500\n",
            "fps step: 9285 fps step and policy inference: 7401 fps total: 6343 epoch: 1309/1500\n",
            "fps step: 9652 fps step and policy inference: 7606 fps total: 6493 epoch: 1310/1500\n",
            "fps step: 10251 fps step and policy inference: 8240 fps total: 6951 epoch: 1311/1500\n",
            "fps step: 9079 fps step and policy inference: 7187 fps total: 6195 epoch: 1312/1500\n",
            "fps step: 9674 fps step and policy inference: 7541 fps total: 6447 epoch: 1313/1500\n",
            "fps step: 9662 fps step and policy inference: 7670 fps total: 6541 epoch: 1314/1500\n",
            "fps step: 9133 fps step and policy inference: 7177 fps total: 6185 epoch: 1315/1500\n",
            "fps step: 9734 fps step and policy inference: 7652 fps total: 6526 epoch: 1316/1500\n",
            "fps step: 10349 fps step and policy inference: 8284 fps total: 6983 epoch: 1317/1500\n",
            "fps step: 8847 fps step and policy inference: 6918 fps total: 5987 epoch: 1318/1500\n",
            "fps step: 9869 fps step and policy inference: 7843 fps total: 6644 epoch: 1319/1500\n",
            "fps step: 9547 fps step and policy inference: 7488 fps total: 6414 epoch: 1320/1500\n",
            "fps step: 9683 fps step and policy inference: 7556 fps total: 6458 epoch: 1321/1500\n",
            "fps step: 8682 fps step and policy inference: 6744 fps total: 5856 epoch: 1322/1500\n",
            "fps step: 8761 fps step and policy inference: 6809 fps total: 5889 epoch: 1323/1500\n",
            "fps step: 9972 fps step and policy inference: 7907 fps total: 6727 epoch: 1324/1500\n",
            "fps step: 9092 fps step and policy inference: 7298 fps total: 6269 epoch: 1325/1500\n",
            "fps step: 9460 fps step and policy inference: 7389 fps total: 6341 epoch: 1326/1500\n",
            "fps step: 10777 fps step and policy inference: 8550 fps total: 7176 epoch: 1327/1500\n",
            "fps step: 9708 fps step and policy inference: 7768 fps total: 6614 epoch: 1328/1500\n",
            "fps step: 8862 fps step and policy inference: 6881 fps total: 5963 epoch: 1329/1500\n",
            "fps step: 9157 fps step and policy inference: 7199 fps total: 6197 epoch: 1330/1500\n",
            "fps step: 9555 fps step and policy inference: 7577 fps total: 6476 epoch: 1331/1500\n",
            "fps step: 10039 fps step and policy inference: 7865 fps total: 6681 epoch: 1332/1500\n",
            "fps step: 8975 fps step and policy inference: 7044 fps total: 6077 epoch: 1333/1500\n",
            "fps step: 9790 fps step and policy inference: 7811 fps total: 6648 epoch: 1334/1500\n",
            "fps step: 10558 fps step and policy inference: 8305 fps total: 7001 epoch: 1335/1500\n",
            "fps step: 9680 fps step and policy inference: 7632 fps total: 6522 epoch: 1336/1500\n",
            "fps step: 10539 fps step and policy inference: 8213 fps total: 6933 epoch: 1337/1500\n",
            "fps step: 9603 fps step and policy inference: 7592 fps total: 6492 epoch: 1338/1500\n",
            "fps step: 10512 fps step and policy inference: 8289 fps total: 6954 epoch: 1339/1500\n",
            "fps step: 10099 fps step and policy inference: 7911 fps total: 6715 epoch: 1340/1500\n",
            "fps step: 10330 fps step and policy inference: 8025 fps total: 6797 epoch: 1341/1500\n",
            "fps step: 9605 fps step and policy inference: 7663 fps total: 6528 epoch: 1342/1500\n",
            "fps step: 8403 fps step and policy inference: 6655 fps total: 5792 epoch: 1343/1500\n",
            "fps step: 9530 fps step and policy inference: 7666 fps total: 6541 epoch: 1344/1500\n",
            "fps step: 9362 fps step and policy inference: 7352 fps total: 6314 epoch: 1345/1500\n",
            "fps step: 9624 fps step and policy inference: 7728 fps total: 6587 epoch: 1346/1500\n",
            "fps step: 9853 fps step and policy inference: 7817 fps total: 6638 epoch: 1347/1500\n",
            "fps step: 10151 fps step and policy inference: 7962 fps total: 6753 epoch: 1348/1500\n",
            "fps step: 10124 fps step and policy inference: 7994 fps total: 6766 epoch: 1349/1500\n",
            "fps step: 9774 fps step and policy inference: 7859 fps total: 6679 epoch: 1350/1500\n",
            "fps step: 9437 fps step and policy inference: 7461 fps total: 6388 epoch: 1351/1500\n",
            "fps step: 10064 fps step and policy inference: 7919 fps total: 6711 epoch: 1352/1500\n",
            "fps step: 9908 fps step and policy inference: 7727 fps total: 6571 epoch: 1353/1500\n",
            "fps step: 8788 fps step and policy inference: 6803 fps total: 5903 epoch: 1354/1500\n",
            "fps step: 11135 fps step and policy inference: 8751 fps total: 7313 epoch: 1355/1500\n",
            "fps step: 9600 fps step and policy inference: 7572 fps total: 6470 epoch: 1356/1500\n",
            "fps step: 10715 fps step and policy inference: 8558 fps total: 7178 epoch: 1357/1500\n",
            "fps step: 9642 fps step and policy inference: 7678 fps total: 6549 epoch: 1358/1500\n",
            "fps step: 11075 fps step and policy inference: 8817 fps total: 7363 epoch: 1359/1500\n",
            "fps step: 9176 fps step and policy inference: 7158 fps total: 6166 epoch: 1360/1500\n",
            "fps step: 9310 fps step and policy inference: 7352 fps total: 6302 epoch: 1361/1500\n",
            "fps step: 9255 fps step and policy inference: 7230 fps total: 6220 epoch: 1362/1500\n",
            "fps step: 9753 fps step and policy inference: 7708 fps total: 6570 epoch: 1363/1500\n",
            "fps step: 9615 fps step and policy inference: 7529 fps total: 6438 epoch: 1364/1500\n",
            "fps step: 10302 fps step and policy inference: 8144 fps total: 6884 epoch: 1365/1500\n",
            "fps step: 9827 fps step and policy inference: 7857 fps total: 6651 epoch: 1366/1500\n",
            "fps step: 10240 fps step and policy inference: 8028 fps total: 6799 epoch: 1367/1500\n",
            "fps step: 9543 fps step and policy inference: 7560 fps total: 6462 epoch: 1368/1500\n",
            "fps step: 9227 fps step and policy inference: 7244 fps total: 6227 epoch: 1369/1500\n",
            "fps step: 10012 fps step and policy inference: 7949 fps total: 6741 epoch: 1370/1500\n",
            "fps step: 8941 fps step and policy inference: 6994 fps total: 6046 epoch: 1371/1500\n",
            "fps step: 9693 fps step and policy inference: 7653 fps total: 6534 epoch: 1372/1500\n",
            "fps step: 9076 fps step and policy inference: 7323 fps total: 6285 epoch: 1373/1500\n",
            "fps step: 10021 fps step and policy inference: 8061 fps total: 6812 epoch: 1374/1500\n",
            "fps step: 9922 fps step and policy inference: 7812 fps total: 6633 epoch: 1375/1500\n",
            "fps step: 8476 fps step and policy inference: 6599 fps total: 5750 epoch: 1376/1500\n",
            "fps step: 10252 fps step and policy inference: 8091 fps total: 6844 epoch: 1377/1500\n",
            "fps step: 10727 fps step and policy inference: 8561 fps total: 7180 epoch: 1378/1500\n",
            "fps step: 7882 fps step and policy inference: 6093 fps total: 5348 epoch: 1379/1500\n",
            "fps step: 8933 fps step and policy inference: 6970 fps total: 6025 epoch: 1380/1500\n",
            "fps step: 10517 fps step and policy inference: 8244 fps total: 6953 epoch: 1381/1500\n",
            "fps step: 9634 fps step and policy inference: 7557 fps total: 6451 epoch: 1382/1500\n",
            "fps step: 11736 fps step and policy inference: 9341 fps total: 7696 epoch: 1383/1500\n",
            "fps step: 9801 fps step and policy inference: 7948 fps total: 6749 epoch: 1384/1500\n",
            "fps step: 9914 fps step and policy inference: 7798 fps total: 6622 epoch: 1385/1500\n",
            "fps step: 9993 fps step and policy inference: 7910 fps total: 6716 epoch: 1386/1500\n",
            "fps step: 9625 fps step and policy inference: 7589 fps total: 6481 epoch: 1387/1500\n",
            "fps step: 10526 fps step and policy inference: 8382 fps total: 7052 epoch: 1388/1500\n",
            "fps step: 10519 fps step and policy inference: 8315 fps total: 7006 epoch: 1389/1500\n",
            "fps step: 8891 fps step and policy inference: 7042 fps total: 6065 epoch: 1390/1500\n",
            "fps step: 10608 fps step and policy inference: 8421 fps total: 7083 epoch: 1391/1500\n",
            "fps step: 9295 fps step and policy inference: 7250 fps total: 6234 epoch: 1392/1500\n",
            "fps step: 8993 fps step and policy inference: 7008 fps total: 6035 epoch: 1393/1500\n",
            "fps step: 9619 fps step and policy inference: 7518 fps total: 6430 epoch: 1394/1500\n",
            "fps step: 9738 fps step and policy inference: 7626 fps total: 6491 epoch: 1395/1500\n",
            "fps step: 8274 fps step and policy inference: 6466 fps total: 5647 epoch: 1396/1500\n",
            "fps step: 9097 fps step and policy inference: 7045 fps total: 6082 epoch: 1397/1500\n",
            "fps step: 10321 fps step and policy inference: 8220 fps total: 6938 epoch: 1398/1500\n",
            "fps step: 9485 fps step and policy inference: 7485 fps total: 6412 epoch: 1399/1500\n",
            "fps step: 11534 fps step and policy inference: 9162 fps total: 7596 epoch: 1400/1500\n",
            "fps step: 11105 fps step and policy inference: 8792 fps total: 7341 epoch: 1401/1500\n",
            "fps step: 8409 fps step and policy inference: 6472 fps total: 5629 epoch: 1402/1500\n",
            "fps step: 9876 fps step and policy inference: 7870 fps total: 6687 epoch: 1403/1500\n",
            "fps step: 9532 fps step and policy inference: 7511 fps total: 6426 epoch: 1404/1500\n",
            "fps step: 9792 fps step and policy inference: 7816 fps total: 6647 epoch: 1405/1500\n",
            "fps step: 10924 fps step and policy inference: 8651 fps total: 7243 epoch: 1406/1500\n",
            "fps step: 9970 fps step and policy inference: 7987 fps total: 6772 epoch: 1407/1500\n",
            "fps step: 10609 fps step and policy inference: 8388 fps total: 7059 epoch: 1408/1500\n",
            "fps step: 9882 fps step and policy inference: 7847 fps total: 6672 epoch: 1409/1500\n",
            "fps step: 9289 fps step and policy inference: 7171 fps total: 6174 epoch: 1410/1500\n",
            "fps step: 9990 fps step and policy inference: 7984 fps total: 6768 epoch: 1411/1500\n",
            "fps step: 11173 fps step and policy inference: 8803 fps total: 7349 epoch: 1412/1500\n",
            "fps step: 9709 fps step and policy inference: 7656 fps total: 6533 epoch: 1413/1500\n",
            "fps step: 8603 fps step and policy inference: 6777 fps total: 5882 epoch: 1414/1500\n",
            "fps step: 9168 fps step and policy inference: 7195 fps total: 6175 epoch: 1415/1500\n",
            "fps step: 9854 fps step and policy inference: 7848 fps total: 6670 epoch: 1416/1500\n",
            "fps step: 8090 fps step and policy inference: 6347 fps total: 5554 epoch: 1417/1500\n",
            "fps step: 10163 fps step and policy inference: 7965 fps total: 6758 epoch: 1418/1500\n",
            "fps step: 10415 fps step and policy inference: 8180 fps total: 6913 epoch: 1419/1500\n",
            "fps step: 10105 fps step and policy inference: 7940 fps total: 6739 epoch: 1420/1500\n",
            "fps step: 10777 fps step and policy inference: 8619 fps total: 7224 epoch: 1421/1500\n",
            "fps step: 8949 fps step and policy inference: 7006 fps total: 6049 epoch: 1422/1500\n",
            "fps step: 10163 fps step and policy inference: 7941 fps total: 6737 epoch: 1423/1500\n",
            "fps step: 9110 fps step and policy inference: 7186 fps total: 6186 epoch: 1424/1500\n",
            "fps step: 9823 fps step and policy inference: 7730 fps total: 6587 epoch: 1425/1500\n",
            "fps step: 9785 fps step and policy inference: 7683 fps total: 6551 epoch: 1426/1500\n",
            "fps step: 9999 fps step and policy inference: 7878 fps total: 6695 epoch: 1427/1500\n",
            "fps step: 9790 fps step and policy inference: 7803 fps total: 6637 epoch: 1428/1500\n",
            "fps step: 9986 fps step and policy inference: 7872 fps total: 6688 epoch: 1429/1500\n",
            "fps step: 8969 fps step and policy inference: 7094 fps total: 6119 epoch: 1430/1500\n",
            "fps step: 10210 fps step and policy inference: 8200 fps total: 6914 epoch: 1431/1500\n",
            "fps step: 9213 fps step and policy inference: 7078 fps total: 6098 epoch: 1432/1500\n",
            "fps step: 9545 fps step and policy inference: 7473 fps total: 6386 epoch: 1433/1500\n",
            "fps step: 9519 fps step and policy inference: 7605 fps total: 6503 epoch: 1434/1500\n",
            "fps step: 10029 fps step and policy inference: 8005 fps total: 6783 epoch: 1435/1500\n",
            "fps step: 9224 fps step and policy inference: 7298 fps total: 6269 epoch: 1436/1500\n",
            "fps step: 10343 fps step and policy inference: 8174 fps total: 6885 epoch: 1437/1500\n",
            "fps step: 10041 fps step and policy inference: 7863 fps total: 6681 epoch: 1438/1500\n",
            "fps step: 10178 fps step and policy inference: 8061 fps total: 6827 epoch: 1439/1500\n",
            "fps step: 8837 fps step and policy inference: 6918 fps total: 5972 epoch: 1440/1500\n",
            "fps step: 9305 fps step and policy inference: 7332 fps total: 6292 epoch: 1441/1500\n",
            "fps step: 9481 fps step and policy inference: 7335 fps total: 6301 epoch: 1442/1500\n",
            "fps step: 10414 fps step and policy inference: 8296 fps total: 6991 epoch: 1443/1500\n",
            "fps step: 9989 fps step and policy inference: 7980 fps total: 6767 epoch: 1444/1500\n",
            "fps step: 10269 fps step and policy inference: 8093 fps total: 6847 epoch: 1445/1500\n",
            "fps step: 10481 fps step and policy inference: 8365 fps total: 7042 epoch: 1446/1500\n",
            "fps step: 9861 fps step and policy inference: 7822 fps total: 6649 epoch: 1447/1500\n",
            "fps step: 10607 fps step and policy inference: 8350 fps total: 7024 epoch: 1448/1500\n",
            "fps step: 10750 fps step and policy inference: 8371 fps total: 7043 epoch: 1449/1500\n",
            "fps step: 10458 fps step and policy inference: 8259 fps total: 6967 epoch: 1450/1500\n",
            "fps step: 11213 fps step and policy inference: 8849 fps total: 7377 epoch: 1451/1500\n",
            "fps step: 9717 fps step and policy inference: 7562 fps total: 6468 epoch: 1452/1500\n",
            "fps step: 11493 fps step and policy inference: 9068 fps total: 7532 epoch: 1453/1500\n",
            "fps step: 10553 fps step and policy inference: 8381 fps total: 7044 epoch: 1454/1500\n",
            "fps step: 10594 fps step and policy inference: 8317 fps total: 7019 epoch: 1455/1500\n",
            "fps step: 10039 fps step and policy inference: 7889 fps total: 6700 epoch: 1456/1500\n",
            "fps step: 11001 fps step and policy inference: 8772 fps total: 7327 epoch: 1457/1500\n",
            "fps step: 9552 fps step and policy inference: 7344 fps total: 6302 epoch: 1458/1500\n",
            "fps step: 10889 fps step and policy inference: 8478 fps total: 7116 epoch: 1459/1500\n",
            "fps step: 10383 fps step and policy inference: 8324 fps total: 7014 epoch: 1460/1500\n",
            "fps step: 9435 fps step and policy inference: 7418 fps total: 6357 epoch: 1461/1500\n",
            "fps step: 10711 fps step and policy inference: 8472 fps total: 7119 epoch: 1462/1500\n",
            "fps step: 9338 fps step and policy inference: 7231 fps total: 6197 epoch: 1463/1500\n",
            "fps step: 9975 fps step and policy inference: 7819 fps total: 6630 epoch: 1464/1500\n",
            "fps step: 10224 fps step and policy inference: 8180 fps total: 6916 epoch: 1465/1500\n",
            "fps step: 9808 fps step and policy inference: 7723 fps total: 6581 epoch: 1466/1500\n",
            "fps step: 10425 fps step and policy inference: 8263 fps total: 6969 epoch: 1467/1500\n",
            "fps step: 10491 fps step and policy inference: 8360 fps total: 7037 epoch: 1468/1500\n",
            "fps step: 10278 fps step and policy inference: 8093 fps total: 6845 epoch: 1469/1500\n",
            "fps step: 10932 fps step and policy inference: 8673 fps total: 7261 epoch: 1470/1500\n",
            "fps step: 9288 fps step and policy inference: 7351 fps total: 6314 epoch: 1471/1500\n",
            "fps step: 10106 fps step and policy inference: 8029 fps total: 6805 epoch: 1472/1500\n",
            "fps step: 10236 fps step and policy inference: 8015 fps total: 6796 epoch: 1473/1500\n",
            "fps step: 10492 fps step and policy inference: 8223 fps total: 6940 epoch: 1474/1500\n",
            "fps step: 9656 fps step and policy inference: 7590 fps total: 6484 epoch: 1475/1500\n",
            "fps step: 10833 fps step and policy inference: 8513 fps total: 7140 epoch: 1476/1500\n",
            "fps step: 9279 fps step and policy inference: 7231 fps total: 6227 epoch: 1477/1500\n",
            "saving next best rewards:  [101.35467]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 10157 fps step and policy inference: 7973 fps total: 6762 epoch: 1478/1500\n",
            "fps step: 9341 fps step and policy inference: 7423 fps total: 6364 epoch: 1479/1500\n",
            "fps step: 9767 fps step and policy inference: 7731 fps total: 6586 epoch: 1480/1500\n",
            "fps step: 10088 fps step and policy inference: 7949 fps total: 6742 epoch: 1481/1500\n",
            "fps step: 8824 fps step and policy inference: 7014 fps total: 6041 epoch: 1482/1500\n",
            "fps step: 10540 fps step and policy inference: 8485 fps total: 7125 epoch: 1483/1500\n",
            "fps step: 9838 fps step and policy inference: 7659 fps total: 6535 epoch: 1484/1500\n",
            "fps step: 11216 fps step and policy inference: 8842 fps total: 7387 epoch: 1485/1500\n",
            "fps step: 10265 fps step and policy inference: 8172 fps total: 6877 epoch: 1486/1500\n",
            "fps step: 10528 fps step and policy inference: 8202 fps total: 6926 epoch: 1487/1500\n",
            "fps step: 10432 fps step and policy inference: 8248 fps total: 6967 epoch: 1488/1500\n",
            "fps step: 9970 fps step and policy inference: 7903 fps total: 6717 epoch: 1489/1500\n",
            "fps step: 11418 fps step and policy inference: 9016 fps total: 7495 epoch: 1490/1500\n",
            "fps step: 9970 fps step and policy inference: 7881 fps total: 6695 epoch: 1491/1500\n",
            "fps step: 9412 fps step and policy inference: 7361 fps total: 6313 epoch: 1492/1500\n",
            "fps step: 10358 fps step and policy inference: 8238 fps total: 6949 epoch: 1493/1500\n",
            "fps step: 10282 fps step and policy inference: 8062 fps total: 6826 epoch: 1494/1500\n",
            "fps step: 10922 fps step and policy inference: 8583 fps total: 7196 epoch: 1495/1500\n",
            "fps step: 9082 fps step and policy inference: 7072 fps total: 6101 epoch: 1496/1500\n",
            "fps step: 9564 fps step and policy inference: 7629 fps total: 6512 epoch: 1497/1500\n",
            "fps step: 9908 fps step and policy inference: 7884 fps total: 6702 epoch: 1498/1500\n",
            "saving next best rewards:  [103.26936]\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/Breakout_envpool.pth'\n",
            "fps step: 9820 fps step and policy inference: 7647 fps total: 6525 epoch: 1499/1500\n",
            "fps step: 10937 fps step and policy inference: 8670 fps total: 7253 epoch: 1500/1500\n",
            "=> saving checkpoint 'runs/Breakout_envpool_23-10-01-59/nn/last_Breakout_envpoolep1500rew[96.06702].pth'\n",
            "MAX EPOCHS NUM!\n"
          ]
        }
      ]
    }
  ]
}